{ "schemaVersion": 1, "deviceProperties": [ { "id": 0, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 1, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 2, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 3, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 4, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 5, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 6, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 7, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 } ], "cupti_version": 22, "cuda_runtime_version": 12040, "cuda_driver_version": 12080, "distributedInfo": {"backend": "nccl", "rank": 4, "world_size": 8, "pg_count": 1, "pg_config": [{"pg_name": "0", "pg_desc": "default_pg", "backend_config": "cuda:nccl", "pg_size": 8, "ranks": [0, 1, 2, 3, 4, 5, 6, 7]}], "nccl_version": "2.21.5"}, "record_shapes": 1, "trace_id": "8ED2348FCF624EB3A9FD0F0CA72D7F2A", "traceEvents": [ { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: DivBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650727367.218, "dur": 117.307, "args": { "External id": 17409,"Record function id": 0, "Sequence number": 246770, "Fwd thread id": 1, "Ev Idx": 0 } }, { "ph": "X", "cat": "cpu_op", "name": "DivBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650727388.315, "dur": 86.614, "args": { "External id": 17410,"Sequence number": 246770, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 1 } }, { "ph": "f", "id": 1, "pid": 1336757, "tid": 1381170, "ts": 1295650727388.315, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336757, "tid": 1381170, "ts": 1295650727396.199, "dur": 76.630, "args": { "External id": 17411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 2 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650727500.085, "dur": 198.234, "args": { "External id": 17412,"Record function id": 0, "Ev Idx": 3 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650727552.468, "dur": 79.642, "args": { "External id": 17413,"Record function id": 0, "Ev Idx": 4 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.27", "pid": 1336757, "tid": 1381170, "ts": 1295650727580.247, "dur": 40.295, "args": { "External id": 17414,"Record function id": 0, "Ev Idx": 5 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650727637.026, "dur": 1.807, "args": { "External id": 17415,"Sequence number": 246769, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6 } }, { "ph": "f", "id": 2, "pid": 1336757, "tid": 1381170, "ts": 1295650727637.026, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650727642.419, "dur": 51.820, "args": { "External id": 17416,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 7 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650727651.940, "dur": 41.764, "args": { "External id": 17417,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 8 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650727661.271, "dur": 2.241, "args": { "External id": 17418,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650727706.960, "dur": 35564.147, "args": { "External id": 17419,"Record function id": 0, "Sequence number": 246767, "Fwd thread id": 1, "Ev Idx": 10 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650727709.084, "dur": 35549.441, "args": { "External id": 17420,"Sequence number": 246767, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11 } }, { "ph": "f", "id": 3, "pid": 1336757, "tid": 1381170, "ts": 1295650727709.084, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650727748.494, "dur": 3.545, "args": { "External id": 17421,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 12 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650727754.993, "dur": 35373.987, "args": { "External id": 17422,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 13 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650727759.314, "dur": 35369.187, "args": { "External id": 17423,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 14 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650727764.097, "dur": 7.031, "args": { "External id": 17424,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 15 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650727772.884, "dur": 35353.679, "args": { "External id": 17425,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 16 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336757, "tid": 1381170, "ts": 1295650763134.905, "dur": 0.571, "args": { "External id": 17426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 17 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650763137.574, "dur": 3.440, "args": { "External id": 17427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 18 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650763139.737, "dur": 1.022, "args": { "External id": 17428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 19 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1381170, "ts": 1295650763147.783, "dur": 35.076, "args": { "External id": 17429,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 20 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336757, "tid": 1381170, "ts": 1295650763190.649, "dur": 56.649, "args": { "External id": 17430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 21 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1381170, "ts": 1295650763192.149, "dur": 54.885, "args": { "External id": 17431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 22 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1381170, "ts": 1295650763193.916, "dur": 52.419, "args": { "External id": 17432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 23 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763283.180, "dur": 16.765, "args": { "External id": 17433,"Record function id": 0, "Sequence number": 246766, "Fwd thread id": 1, "Ev Idx": 24 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763285.196, "dur": 12.141, "args": { "External id": 17434,"Sequence number": 246766, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 25 } }, { "ph": "f", "id": 4, "pid": 1336757, "tid": 1381170, "ts": 1295650763285.196, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650763289.641, "dur": 7.465, "args": { "External id": 17435,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 26 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650763291.635, "dur": 5.232, "args": { "External id": 17436,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 27 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763303.846, "dur": 98.620, "args": { "External id": 17437,"Record function id": 0, "Sequence number": 246765, "Fwd thread id": 1, "Ev Idx": 28 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763304.685, "dur": 90.549, "args": { "External id": 17438,"Sequence number": 246765, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 29 } }, { "ph": "f", "id": 5, "pid": 1336757, "tid": 1381170, "ts": 1295650763304.685, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650763307.698, "dur": 87.001, "args": { "External id": 17439,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 30 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650763314.264, "dur": 36.226, "args": { "External id": 17440,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 31 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650763316.826, "dur": 4.862, "args": { "External id": 17441,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 32 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650763323.523, "dur": 26.668, "args": { "External id": 17442,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 33 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650763328.322, "dur": 21.401, "args": { "External id": 17443,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 34 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650763353.128, "dur": 6.127, "args": { "External id": 17444,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 35 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650763357.169, "dur": 1.716, "args": { "External id": 17445,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 36 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650763360.262, "dur": 33.505, "args": { "External id": 17446,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 37 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763406.559, "dur": 62.108, "args": { "External id": 17447,"Record function id": 0, "Sequence number": 246764, "Fwd thread id": 1, "Ev Idx": 38 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763407.389, "dur": 57.980, "args": { "External id": 17448,"Sequence number": 246764, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 39 } }, { "ph": "f", "id": 6, "pid": 1336757, "tid": 1381170, "ts": 1295650763407.389, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650763411.545, "dur": 53.596, "args": { "External id": 17449,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "3"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 40 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650763414.855, "dur": 19.268, "args": { "External id": 17450,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 41 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650763416.110, "dur": 2.721, "args": { "External id": 17451,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 42 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650763419.480, "dur": 14.391, "args": { "External id": 17452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 43 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650763420.484, "dur": 12.907, "args": { "External id": 17453,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 44 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650763438.473, "dur": 6.346, "args": { "External id": 17454,"Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 45 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650763443.093, "dur": 1.010, "args": { "External id": 17455,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 46 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650763445.717, "dur": 18.941, "args": { "External id": 17456,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 47 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763472.688, "dur": 122.307, "args": { "External id": 17457,"Record function id": 0, "Sequence number": 246763, "Fwd thread id": 1, "Ev Idx": 48 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763473.673, "dur": 117.924, "args": { "External id": 17458,"Sequence number": 246763, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 49 } }, { "ph": "f", "id": 7, "pid": 1336757, "tid": 1381170, "ts": 1295650763473.673, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650763475.894, "dur": 115.354, "args": { "External id": 17459,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 50 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650763479.412, "dur": 17.135, "args": { "External id": 17460,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 51 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650763480.522, "dur": 1.906, "args": { "External id": 17461,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 52 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650763483.214, "dur": 13.073, "args": { "External id": 17462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 53 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650763484.002, "dur": 11.883, "args": { "External id": 17463,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 54 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650763499.724, "dur": 2.917, "args": { "External id": 17464,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 55 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650763501.768, "dur": 0.675, "args": { "External id": 17465,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 56 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650763503.314, "dur": 87.116, "args": { "External id": 17466,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 57 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763601.383, "dur": 94.786, "args": { "External id": 17467,"Record function id": 0, "Sequence number": 246762, "Fwd thread id": 1, "Ev Idx": 58 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763602.427, "dur": 90.610, "args": { "External id": 17468,"Sequence number": 246762, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 59 } }, { "ph": "f", "id": 8, "pid": 1336757, "tid": 1381170, "ts": 1295650763602.427, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650763604.164, "dur": 88.538, "args": { "External id": 17469,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 60 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650763605.681, "dur": 21.072, "args": { "External id": 17470,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 61 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650763606.879, "dur": 4.446, "args": { "External id": 17471,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 62 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650763612.478, "dur": 14.016, "args": { "External id": 17472,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 63 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650763613.137, "dur": 12.998, "args": { "External id": 17473,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 64 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650763630.165, "dur": 5.129, "args": { "External id": 17474,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 65 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650763634.671, "dur": 0.420, "args": { "External id": 17475,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 66 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650763635.929, "dur": 56.158, "args": { "External id": 17476,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 67 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763700.463, "dur": 35.008, "args": { "External id": 17477,"Record function id": 0, "Sequence number": 246761, "Fwd thread id": 1, "Ev Idx": 68 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650763701.586, "dur": 0.948, "args": { "External id": 17478,"Sequence number": 246761, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 69 } }, { "ph": "f", "id": 9, "pid": 1336757, "tid": 1381170, "ts": 1295650763701.586, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650763705.206, "dur": 27.339, "args": { "External id": 17479,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 70 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650763707.416, "dur": 24.680, "args": { "External id": 17480,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 71 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650763713.245, "dur": 0.503, "args": { "External id": 17481,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 72 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650763740.579, "dur": 2310.567, "args": { "External id": 17482,"Record function id": 0, "Sequence number": 246759, "Fwd thread id": 1, "Ev Idx": 73 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650763742.060, "dur": 2274.865, "args": { "External id": 17483,"Sequence number": 246759, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 74 } }, { "ph": "f", "id": 10, "pid": 1336757, "tid": 1381170, "ts": 1295650763742.060, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650763778.563, "dur": 2.857, "args": { "External id": 17484,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 75 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650763783.818, "dur": 2116.520, "args": { "External id": 17485,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 76 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650763785.691, "dur": 2114.315, "args": { "External id": 17486,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 77 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650763788.939, "dur": 3.618, "args": { "External id": 17487,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 78 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650763795.907, "dur": 2103.140, "args": { "External id": 17488,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 79 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336757, "tid": 1381170, "ts": 1295650765903.918, "dur": 0.305, "args": { "External id": 17489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 80 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650765905.654, "dur": 2.657, "args": { "External id": 17490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 81 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650765907.298, "dur": 0.885, "args": { "External id": 17491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 82 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1381170, "ts": 1295650765912.796, "dur": 23.326, "args": { "External id": 17492,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 83 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336757, "tid": 1381170, "ts": 1295650765941.695, "dur": 66.213, "args": { "External id": 17493,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 84 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1381170, "ts": 1295650765943.056, "dur": 64.621, "args": { "External id": 17494,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 85 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1381170, "ts": 1295650765944.403, "dur": 62.569, "args": { "External id": 17495,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 86 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650766026.727, "dur": 21.328, "args": { "External id": 17496,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 87 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766058.770, "dur": 14.376, "args": { "External id": 17497,"Record function id": 0, "Sequence number": 246758, "Fwd thread id": 1, "Ev Idx": 88 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766062.432, "dur": 8.229, "args": { "External id": 17498,"Sequence number": 246758, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 89 } }, { "ph": "f", "id": 11, "pid": 1336757, "tid": 1381170, "ts": 1295650766062.432, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650766064.968, "dur": 5.490, "args": { "External id": 17499,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 90 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650766066.408, "dur": 3.920, "args": { "External id": 17500,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 91 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766076.392, "dur": 70.715, "args": { "External id": 17501,"Record function id": 0, "Sequence number": 246757, "Fwd thread id": 1, "Ev Idx": 92 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766077.748, "dur": 64.917, "args": { "External id": 17502,"Sequence number": 246757, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 93 } }, { "ph": "f", "id": 12, "pid": 1336757, "tid": 1381170, "ts": 1295650766077.748, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650766080.148, "dur": 62.137, "args": { "External id": 17503,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 94 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650766082.450, "dur": 23.215, "args": { "External id": 17504,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 95 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650766084.474, "dur": 3.074, "args": { "External id": 17505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 96 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650766088.473, "dur": 16.919, "args": { "External id": 17506,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 97 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650766089.580, "dur": 15.424, "args": { "External id": 17507,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 98 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650766107.360, "dur": 6.320, "args": { "External id": 17508,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 99 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650766110.263, "dur": 3.086, "args": { "External id": 17509,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650766117.255, "dur": 24.283, "args": { "External id": 17510,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766150.817, "dur": 53.754, "args": { "External id": 17511,"Record function id": 0, "Sequence number": 246756, "Fwd thread id": 1, "Ev Idx": 102 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766151.882, "dur": 48.979, "args": { "External id": 17512,"Sequence number": 246756, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 103 } }, { "ph": "f", "id": 13, "pid": 1336757, "tid": 1381170, "ts": 1295650766151.882, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650766154.508, "dur": 46.121, "args": { "External id": 17513,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "2"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650766156.253, "dur": 18.823, "args": { "External id": 17514,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650766157.172, "dur": 2.061, "args": { "External id": 17515,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650766159.857, "dur": 14.947, "args": { "External id": 17516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650766160.930, "dur": 13.493, "args": { "External id": 17517,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650766176.456, "dur": 7.819, "args": { "External id": 17518,"Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650766182.764, "dur": 0.877, "args": { "External id": 17519,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650766185.029, "dur": 15.180, "args": { "External id": 17520,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 111 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766208.282, "dur": 106.525, "args": { "External id": 17521,"Record function id": 0, "Sequence number": 246755, "Fwd thread id": 1, "Ev Idx": 112 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766209.138, "dur": 101.978, "args": { "External id": 17522,"Sequence number": 246755, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 113 } }, { "ph": "f", "id": 14, "pid": 1336757, "tid": 1381170, "ts": 1295650766209.138, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650766210.911, "dur": 99.843, "args": { "External id": 17523,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650766212.127, "dur": 15.011, "args": { "External id": 17524,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650766213.062, "dur": 1.838, "args": { "External id": 17525,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650766215.620, "dur": 11.276, "args": { "External id": 17526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650766216.307, "dur": 10.246, "args": { "External id": 17527,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650766239.668, "dur": 6.128, "args": { "External id": 17528,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650766244.582, "dur": 0.789, "args": { "External id": 17529,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650766246.525, "dur": 63.351, "args": { "External id": 17530,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766321.813, "dur": 96.419, "args": { "External id": 17531,"Record function id": 0, "Sequence number": 246754, "Fwd thread id": 1, "Ev Idx": 122 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766322.941, "dur": 75.828, "args": { "External id": 17532,"Sequence number": 246754, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 123 } }, { "ph": "f", "id": 15, "pid": 1336757, "tid": 1381170, "ts": 1295650766322.941, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650766324.476, "dur": 74.041, "args": { "External id": 17533,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650766326.201, "dur": 16.479, "args": { "External id": 17534,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650766327.179, "dur": 2.260, "args": { "External id": 17535,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650766330.194, "dur": 12.218, "args": { "External id": 17536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650766330.992, "dur": 11.048, "args": { "External id": 17537,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650766343.823, "dur": 2.694, "args": { "External id": 17538,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650766345.709, "dur": 0.615, "args": { "External id": 17539,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650766347.317, "dur": 50.598, "args": { "External id": 17540,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650766402.546, "dur": 14.320, "args": { "External id": 17541,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 132 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766424.162, "dur": 33.447, "args": { "External id": 17542,"Record function id": 0, "Sequence number": 246753, "Fwd thread id": 1, "Ev Idx": 133 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650766425.330, "dur": 1.044, "args": { "External id": 17543,"Sequence number": 246753, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 134 } }, { "ph": "f", "id": 16, "pid": 1336757, "tid": 1381170, "ts": 1295650766425.330, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650766428.408, "dur": 26.392, "args": { "External id": 17544,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650766430.299, "dur": 24.040, "args": { "External id": 17545,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650766435.269, "dur": 2.928, "args": { "External id": 17546,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 137 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650766462.037, "dur": 3084.103, "args": { "External id": 17547,"Record function id": 0, "Sequence number": 246751, "Fwd thread id": 1, "Ev Idx": 138 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650766466.115, "dur": 3055.357, "args": { "External id": 17548,"Sequence number": 246751, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 139 } }, { "ph": "f", "id": 17, "pid": 1336757, "tid": 1381170, "ts": 1295650766466.115, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650766495.606, "dur": 2.401, "args": { "External id": 17549,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650766500.178, "dur": 2934.059, "args": { "External id": 17550,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650766501.548, "dur": 2932.359, "args": { "External id": 17551,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650766504.282, "dur": 3.034, "args": { "External id": 17552,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650766507.972, "dur": 2925.171, "args": { "External id": 17553,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336757, "tid": 1381170, "ts": 1295650769437.988, "dur": 0.250, "args": { "External id": 17554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650769439.629, "dur": 5.396, "args": { "External id": 17555,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 146 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650769444.087, "dur": 0.763, "args": { "External id": 17556,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1381170, "ts": 1295650769448.987, "dur": 21.889, "args": { "External id": 17557,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336757, "tid": 1381170, "ts": 1295650769476.496, "dur": 37.886, "args": { "External id": 17558,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1381170, "ts": 1295650769477.801, "dur": 36.413, "args": { "External id": 17559,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1381170, "ts": 1295650769479.348, "dur": 34.503, "args": { "External id": 17560,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650769528.542, "dur": 14.858, "args": { "External id": 17561,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 152 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769556.273, "dur": 10.193, "args": { "External id": 17562,"Record function id": 0, "Sequence number": 246750, "Fwd thread id": 1, "Ev Idx": 153 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769557.441, "dur": 7.150, "args": { "External id": 17563,"Sequence number": 246750, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 154 } }, { "ph": "f", "id": 18, "pid": 1336757, "tid": 1381170, "ts": 1295650769557.441, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650769559.948, "dur": 4.443, "args": { "External id": 17564,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650769561.398, "dur": 2.878, "args": { "External id": 17565,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 156 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769569.760, "dur": 59.446, "args": { "External id": 17566,"Record function id": 0, "Sequence number": 246749, "Fwd thread id": 1, "Ev Idx": 157 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769573.504, "dur": 51.982, "args": { "External id": 17567,"Sequence number": 246749, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 158 } }, { "ph": "f", "id": 19, "pid": 1336757, "tid": 1381170, "ts": 1295650769573.504, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650769575.256, "dur": 49.872, "args": { "External id": 17568,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650769577.722, "dur": 19.943, "args": { "External id": 17569,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650769579.352, "dur": 2.169, "args": { "External id": 17570,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650769582.166, "dur": 15.228, "args": { "External id": 17571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650769583.535, "dur": 13.361, "args": { "External id": 17572,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650769598.856, "dur": 3.526, "args": { "External id": 17573,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650769601.484, "dur": 0.629, "args": { "External id": 17574,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650769603.180, "dur": 21.150, "args": { "External id": 17575,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 166 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769633.267, "dur": 55.327, "args": { "External id": 17576,"Record function id": 0, "Sequence number": 246748, "Fwd thread id": 1, "Ev Idx": 167 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769634.142, "dur": 52.137, "args": { "External id": 17577,"Sequence number": 246748, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 168 } }, { "ph": "f", "id": 20, "pid": 1336757, "tid": 1381170, "ts": 1295650769634.142, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650769635.997, "dur": 50.037, "args": { "External id": 17578,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650769640.365, "dur": 21.299, "args": { "External id": 17579,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650769641.208, "dur": 2.285, "args": { "External id": 17580,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650769644.057, "dur": 17.339, "args": { "External id": 17581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650769645.079, "dur": 15.829, "args": { "External id": 17582,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650769662.664, "dur": 6.788, "args": { "External id": 17583,"Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650769667.199, "dur": 1.679, "args": { "External id": 17584,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650769670.112, "dur": 15.429, "args": { "External id": 17585,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 176 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769692.349, "dur": 93.098, "args": { "External id": 17586,"Record function id": 0, "Sequence number": 246747, "Fwd thread id": 1, "Ev Idx": 177 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769693.480, "dur": 89.420, "args": { "External id": 17587,"Sequence number": 246747, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 178 } }, { "ph": "f", "id": 21, "pid": 1336757, "tid": 1381170, "ts": 1295650769693.480, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650769695.165, "dur": 87.318, "args": { "External id": 17588,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650769696.180, "dur": 18.613, "args": { "External id": 17589,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650769699.530, "dur": 1.859, "args": { "External id": 17590,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650769701.924, "dur": 12.614, "args": { "External id": 17591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650769702.549, "dur": 11.534, "args": { "External id": 17592,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650769715.641, "dur": 3.208, "args": { "External id": 17593,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650769717.959, "dur": 0.684, "args": { "External id": 17594,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650769719.495, "dur": 62.211, "args": { "External id": 17595,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 186 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769789.005, "dur": 93.857, "args": { "External id": 17596,"Record function id": 0, "Sequence number": 246746, "Fwd thread id": 1, "Ev Idx": 187 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769790.186, "dur": 75.578, "args": { "External id": 17597,"Sequence number": 246746, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 188 } }, { "ph": "f", "id": 22, "pid": 1336757, "tid": 1381170, "ts": 1295650769790.186, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650769793.893, "dur": 71.520, "args": { "External id": 17598,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650769795.139, "dur": 16.737, "args": { "External id": 17599,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650769797.966, "dur": 1.728, "args": { "External id": 17600,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650769800.119, "dur": 11.509, "args": { "External id": 17601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650769800.937, "dur": 10.326, "args": { "External id": 17602,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650769812.529, "dur": 2.808, "args": { "External id": 17603,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650769814.523, "dur": 0.562, "args": { "External id": 17604,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650769816.027, "dur": 48.775, "args": { "External id": 17605,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650769868.598, "dur": 13.215, "args": { "External id": 17606,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 197 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769886.695, "dur": 30.523, "args": { "External id": 17607,"Record function id": 0, "Sequence number": 246745, "Fwd thread id": 1, "Ev Idx": 198 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650769887.957, "dur": 0.921, "args": { "External id": 17608,"Sequence number": 246745, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 199 } }, { "ph": "f", "id": 23, "pid": 1336757, "tid": 1381170, "ts": 1295650769887.957, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650769890.592, "dur": 23.187, "args": { "External id": 17609,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650769892.424, "dur": 20.941, "args": { "External id": 17610,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650769896.851, "dur": 0.590, "args": { "External id": 17611,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 202 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650769921.251, "dur": 3147.552, "args": { "External id": 17612,"Record function id": 0, "Sequence number": 246744, "Fwd thread id": 1, "Ev Idx": 203 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650769931.495, "dur": 3106.315, "args": { "External id": 17613,"Sequence number": 246744, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 204 } }, { "ph": "f", "id": 24, "pid": 1336757, "tid": 1381170, "ts": 1295650769931.495, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650769956.005, "dur": 1.972, "args": { "External id": 17614,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650769960.124, "dur": 2974.260, "args": { "External id": 17615,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650769961.113, "dur": 2972.945, "args": { "External id": 17616,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650769964.104, "dur": 2.500, "args": { "External id": 17617,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650769967.283, "dur": 2965.701, "args": { "External id": 17618,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336757, "tid": 1381170, "ts": 1295650772937.683, "dur": 0.372, "args": { "External id": 17619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650772939.179, "dur": 2.008, "args": { "External id": 17620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 211 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336757, "tid": 1381170, "ts": 1295650772940.231, "dur": 0.832, "args": { "External id": 17621,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1381170, "ts": 1295650772944.494, "dur": 20.998, "args": { "External id": 17622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336757, "tid": 1381170, "ts": 1295650772969.578, "dur": 61.152, "args": { "External id": 17623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1381170, "ts": 1295650772970.749, "dur": 59.816, "args": { "External id": 17624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1381170, "ts": 1295650772972.261, "dur": 57.614, "args": { "External id": 17625,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650773048.263, "dur": 16.644, "args": { "External id": 17626,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 217 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650773084.118, "dur": 12.432, "args": { "External id": 17627,"Record function id": 0, "Ev Idx": 218 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650773086.929, "dur": 8.049, "args": { "External id": 17628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650773089.844, "dur": 4.328, "args": { "External id": 17629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 220 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650773090.770, "dur": 3.287, "args": { "External id": 17630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 221 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773100.228, "dur": 9.328, "args": { "External id": 17631,"Record function id": 0, "Sequence number": 246743, "Fwd thread id": 1, "Ev Idx": 222 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773101.485, "dur": 6.166, "args": { "External id": 17632,"Sequence number": 246743, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 223 } }, { "ph": "f", "id": 25, "pid": 1336757, "tid": 1381170, "ts": 1295650773101.485, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650773103.791, "dur": 3.669, "args": { "External id": 17633,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650773105.017, "dur": 2.334, "args": { "External id": 17634,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 225 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773112.558, "dur": 63.904, "args": { "External id": 17635,"Record function id": 0, "Sequence number": 246742, "Fwd thread id": 1, "Ev Idx": 226 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773115.897, "dur": 55.977, "args": { "External id": 17636,"Sequence number": 246742, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 227 } }, { "ph": "f", "id": 26, "pid": 1336757, "tid": 1381170, "ts": 1295650773115.897, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650773117.859, "dur": 53.682, "args": { "External id": 17637,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650773120.134, "dur": 21.845, "args": { "External id": 17638,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650773121.617, "dur": 2.574, "args": { "External id": 17639,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650773124.909, "dur": 16.746, "args": { "External id": 17640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650773126.290, "dur": 14.944, "args": { "External id": 17641,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650773143.335, "dur": 3.395, "args": { "External id": 17642,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773145.722, "dur": 0.763, "args": { "External id": 17643,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650773147.498, "dur": 23.276, "args": { "External id": 17644,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 235 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773182.320, "dur": 61.803, "args": { "External id": 17645,"Record function id": 0, "Sequence number": 246741, "Fwd thread id": 1, "Ev Idx": 236 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773183.218, "dur": 57.677, "args": { "External id": 17646,"Sequence number": 246741, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 237 } }, { "ph": "f", "id": 27, "pid": 1336757, "tid": 1381170, "ts": 1295650773183.218, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650773185.226, "dur": 55.414, "args": { "External id": 17647,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650773189.027, "dur": 17.623, "args": { "External id": 17648,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650773190.103, "dur": 2.032, "args": { "External id": 17649,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650773192.738, "dur": 13.661, "args": { "External id": 17650,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650773193.681, "dur": 12.358, "args": { "External id": 17651,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650773207.887, "dur": 4.986, "args": { "External id": 17652,"Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773211.682, "dur": 0.715, "args": { "External id": 17653,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650773213.607, "dur": 26.160, "args": { "External id": 17654,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 245 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773249.549, "dur": 101.296, "args": { "External id": 17655,"Record function id": 0, "Sequence number": 246740, "Fwd thread id": 1, "Ev Idx": 246 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773250.544, "dur": 98.241, "args": { "External id": 17656,"Sequence number": 246740, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 247 } }, { "ph": "f", "id": 28, "pid": 1336757, "tid": 1381170, "ts": 1295650773250.544, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650773252.773, "dur": 95.577, "args": { "External id": 17657,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650773256.723, "dur": 24.215, "args": { "External id": 17658,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650773260.713, "dur": 2.497, "args": { "External id": 17659,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650773263.901, "dur": 16.767, "args": { "External id": 17660,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650773264.440, "dur": 15.868, "args": { "External id": 17661,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650773281.879, "dur": 4.604, "args": { "External id": 17662,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773283.690, "dur": 2.537, "args": { "External id": 17663,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650773286.923, "dur": 60.858, "args": { "External id": 17664,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 255 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773354.507, "dur": 102.431, "args": { "External id": 17665,"Record function id": 0, "Sequence number": 246739, "Fwd thread id": 1, "Ev Idx": 256 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773355.376, "dur": 83.105, "args": { "External id": 17666,"Sequence number": 246739, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 257 } }, { "ph": "f", "id": 29, "pid": 1336757, "tid": 1381170, "ts": 1295650773355.376, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650773356.990, "dur": 81.226, "args": { "External id": 17667,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1381170, "ts": 1295650773357.997, "dur": 23.433, "args": { "External id": 17668,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650773361.176, "dur": 1.762, "args": { "External id": 17669,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1381170, "ts": 1295650773367.685, "dur": 13.482, "args": { "External id": 17670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1381170, "ts": 1295650773369.663, "dur": 11.035, "args": { "External id": 17671,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650773382.358, "dur": 5.910, "args": { "External id": 17672,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773387.574, "dur": 0.494, "args": { "External id": 17673,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650773389.035, "dur": 48.664, "args": { "External id": 17674,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650773442.033, "dur": 13.407, "args": { "External id": 17675,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650773462.774, "dur": 329.748, "args": { "External id": 17676,"Record function id": 0, "Sequence number": 246738, "Fwd thread id": 1, "Ev Idx": 267 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650773464.576, "dur": 321.130, "args": { "External id": 17677,"Sequence number": 246738, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 268 } }, { "ph": "f", "id": 30, "pid": 1336757, "tid": 1381170, "ts": 1295650773464.576, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295650773628.797, "dur": 41.849, "args": { "External id": 17678,"kernel_hash": "cl7ukpd4jntugtfn4xeypgd5onvbe6twamcfekvhw4dgeizu3kp2", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "262144", "2048", "1", "1986", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/l7/cl7ukpd4jntugtfn4xeypgd5onvbe6twamcfekvhw4dgeizu3kp2.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 2048], [2048], [262144, 2048], [262144, 2048], [132, 2048], [262144], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 269 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_0", "pid": 1336757, "tid": 1381170, "ts": 1295650773700.084, "dur": 27.293, "args": { "External id": 17679,"kernel_hash": "ctrxskj43j6wttul7meux4tf5uhrizad56rruyqg3gopczymn3ux", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/tr/ctrxskj43j6wttul7meux4tf5uhrizad56rruyqg3gopczymn3ux.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 270 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_1", "pid": 1336757, "tid": 1381170, "ts": 1295650773745.967, "dur": 18.528, "args": { "External id": 17680,"kernel_hash": "chk6naviqoas7yeoerriva67j5bcolw65yisn4ks734r66m7rt3g", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/hk/chk6naviqoas7yeoerriva67j5bcolw65yisn4ks734r66m7rt3g.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 271 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650773801.304, "dur": 12.511, "args": { "External id": 17681,"Record function id": 0, "Ev Idx": 272 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650773804.112, "dur": 8.923, "args": { "External id": 17682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650773806.911, "dur": 5.304, "args": { "External id": 17683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 274 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650773809.099, "dur": 3.013, "args": { "External id": 17684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 275 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: StackBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773819.942, "dur": 31.063, "args": { "External id": 17685,"Record function id": 0, "Sequence number": 246737, "Fwd thread id": 1, "Ev Idx": 276 } }, { "ph": "X", "cat": "cpu_op", "name": "StackBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773821.113, "dur": 23.749, "args": { "External id": 17686,"Sequence number": 246737, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 277 } }, { "ph": "f", "id": 31, "pid": 1336757, "tid": 1381170, "ts": 1295650773821.113, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650773823.735, "dur": 8.597, "args": { "External id": 17687,"Record function id": 0, "Concrete Inputs": ["", "-2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773829.514, "dur": 0.935, "args": { "External id": 17688,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650773832.913, "dur": 4.022, "args": { "External id": 17689,"Record function id": 0, "Concrete Inputs": ["", "-2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773835.712, "dur": 0.461, "args": { "External id": 17690,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650773837.316, "dur": 3.139, "args": { "External id": 17691,"Record function id": 0, "Concrete Inputs": ["", "-2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773839.228, "dur": 0.291, "args": { "External id": 17692,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1381170, "ts": 1295650773840.946, "dur": 3.404, "args": { "External id": 17693,"Record function id": 0, "Concrete Inputs": ["", "-2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773843.175, "dur": 0.433, "args": { "External id": 17694,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 285 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773854.680, "dur": 5.236, "args": { "External id": 17695,"Record function id": 0, "Sequence number": 246736, "Fwd thread id": 1, "Ev Idx": 286 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650773855.620, "dur": 1.088, "args": { "External id": 17696,"Sequence number": 246736, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 287 } }, { "ph": "f", "id": 32, "pid": 1336757, "tid": 1381170, "ts": 1295650773855.620, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650773864.148, "dur": 580.196, "args": { "External id": 17697,"Record function id": 0, "Sequence number": 246735, "Fwd thread id": 1, "Ev Idx": 288 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650773865.813, "dur": 565.986, "args": { "External id": 17698,"Sequence number": 246735, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 289 } }, { "ph": "f", "id": 33, "pid": 1336757, "tid": 1381170, "ts": 1295650773865.813, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650773902.405, "dur": 11.468, "args": { "External id": 17699,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650773908.945, "dur": 4.575, "args": { "External id": 17700,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650773918.007, "dur": 8.277, "args": { "External id": 17701,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650773920.415, "dur": 4.918, "args": { "External id": 17702,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773924.604, "dur": 0.514, "args": { "External id": 17703,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1381170, "ts": 1295650773930.123, "dur": 170.787, "args": { "External id": 17704,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650773930.932, "dur": 5.469, "args": { "External id": 17705,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650773931.758, "dur": 3.947, "args": { "External id": 17706,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650773933.384, "dur": 2.187, "args": { "External id": 17707,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1381170, "ts": 1295650773937.816, "dur": 162.125, "args": { "External id": 17708,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650773941.163, "dur": 157.074, "args": { "External id": 17709,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650774107.784, "dur": 5.307, "args": { "External id": 17710,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774109.977, "dur": 3.006, "args": { "External id": 17711,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650774149.124, "dur": 5.454, "args": { "External id": 17712,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650774156.159, "dur": 3.924, "args": { "External id": 17713,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650774161.544, "dur": 1.433, "args": { "External id": 17714,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650774201.690, "dur": 2.485, "args": { "External id": 17715,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774202.689, "dur": 1.335, "args": { "External id": 17716,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336757, "tid": 1381170, "ts": 1295650774243.760, "dur": 166.753, "args": { "External id": 17717,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650774250.814, "dur": 9.941, "args": { "External id": 17718,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774256.593, "dur": 1.019, "args": { "External id": 17719,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650774263.284, "dur": 8.909, "args": { "External id": 17720,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774268.850, "dur": 2.588, "args": { "External id": 17721,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650774274.562, "dur": 2.873, "args": { "External id": 17722,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774276.489, "dur": 0.547, "args": { "External id": 17723,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650774278.794, "dur": 2.737, "args": { "External id": 17724,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774280.561, "dur": 0.548, "args": { "External id": 17725,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650774288.890, "dur": 3.321, "args": { "External id": 17726,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774291.481, "dur": 0.395, "args": { "External id": 17727,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650774293.583, "dur": 7.353, "args": { "External id": 17728,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650774298.329, "dur": 2.408, "args": { "External id": 17729,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650774302.096, "dur": 2.529, "args": { "External id": 17730,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774303.982, "dur": 0.277, "args": { "External id": 17731,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650774305.741, "dur": 2.338, "args": { "External id": 17732,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774306.803, "dur": 1.171, "args": { "External id": 17733,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295650774309.603, "dur": 84.696, "args": { "External id": 17734,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774398.680, "dur": 2.909, "args": { "External id": 17735,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650774402.828, "dur": 3.503, "args": { "External id": 17736,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774405.355, "dur": 0.514, "args": { "External id": 17737,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774408.525, "dur": 0.883, "args": { "External id": 17738,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 329 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650774458.781, "dur": 11.043, "args": { "External id": 17739,"Record function id": 0, "Ev Idx": 330 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650774461.540, "dur": 7.380, "args": { "External id": 17740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650774464.169, "dur": 4.044, "args": { "External id": 17741,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 332 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650774465.528, "dur": 2.529, "args": { "External id": 17742,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774474.553, "dur": 9.332, "args": { "External id": 17743,"Record function id": 0, "Sequence number": 246734, "Fwd thread id": 1, "Ev Idx": 334 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774476.115, "dur": 5.590, "args": { "External id": 17744,"Sequence number": 246734, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 335 } }, { "ph": "f", "id": 34, "pid": 1336757, "tid": 1381170, "ts": 1295650774476.115, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650774477.768, "dur": 3.738, "args": { "External id": 17745,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774480.442, "dur": 0.976, "args": { "External id": 17746,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774487.757, "dur": 175.238, "args": { "External id": 17747,"Record function id": 0, "Sequence number": 246733, "Fwd thread id": 1, "Ev Idx": 338 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774488.585, "dur": 168.289, "args": { "External id": 17748,"Sequence number": 246733, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 339 } }, { "ph": "f", "id": 35, "pid": 1336757, "tid": 1381170, "ts": 1295650774488.585, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774491.792, "dur": 4.796, "args": { "External id": 17749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774493.144, "dur": 2.881, "args": { "External id": 17750,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774495.392, "dur": 0.447, "args": { "External id": 17751,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650774498.021, "dur": 62.456, "args": { "External id": 17752,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774563.781, "dur": 4.414, "args": { "External id": 17753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774564.759, "dur": 2.669, "args": { "External id": 17754,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774566.553, "dur": 0.675, "args": { "External id": 17755,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774569.975, "dur": 3.473, "args": { "External id": 17756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774570.717, "dur": 2.230, "args": { "External id": 17757,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774572.334, "dur": 0.493, "args": { "External id": 17758,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650774576.183, "dur": 79.924, "args": { "External id": 17759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 350 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774667.824, "dur": 6.744, "args": { "External id": 17760,"Record function id": 0, "Sequence number": 246732, "Fwd thread id": 1, "Ev Idx": 351 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774668.900, "dur": 4.449, "args": { "External id": 17761,"Sequence number": 246732, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 352 } }, { "ph": "f", "id": 36, "pid": 1336757, "tid": 1381170, "ts": 1295650774668.900, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650774670.590, "dur": 2.614, "args": { "External id": 17762,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774671.760, "dur": 1.300, "args": { "External id": 17763,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 354 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774678.166, "dur": 10.826, "args": { "External id": 17764,"Record function id": 0, "Sequence number": 246731, "Fwd thread id": 1, "Ev Idx": 355 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774679.456, "dur": 7.231, "args": { "External id": 17765,"Sequence number": 246731, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 356 } }, { "ph": "f", "id": 37, "pid": 1336757, "tid": 1381170, "ts": 1295650774679.456, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774680.374, "dur": 6.086, "args": { "External id": 17766,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774681.249, "dur": 4.676, "args": { "External id": 17767,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774685.388, "dur": 0.426, "args": { "External id": 17768,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 359 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650774693.411, "dur": 5.676, "args": { "External id": 17769,"Record function id": 0, "Ev Idx": 360 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650774695.041, "dur": 3.519, "args": { "External id": 17770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650774696.297, "dur": 1.991, "args": { "External id": 17771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 362 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650774697.161, "dur": 1.012, "args": { "External id": 17772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 363 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774702.667, "dur": 6.186, "args": { "External id": 17773,"Record function id": 0, "Sequence number": 246730, "Fwd thread id": 1, "Ev Idx": 364 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774704.071, "dur": 2.776, "args": { "External id": 17774,"Sequence number": 246730, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 365 } }, { "ph": "f", "id": 38, "pid": 1336757, "tid": 1381170, "ts": 1295650774704.071, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650774704.963, "dur": 1.748, "args": { "External id": 17775,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774705.771, "dur": 0.788, "args": { "External id": 17776,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 367 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774711.918, "dur": 152.339, "args": { "External id": 17777,"Record function id": 0, "Sequence number": 246729, "Fwd thread id": 1, "Ev Idx": 368 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774712.826, "dur": 144.765, "args": { "External id": 17778,"Sequence number": 246729, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 369 } }, { "ph": "f", "id": 39, "pid": 1336757, "tid": 1381170, "ts": 1295650774712.826, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774717.273, "dur": 2.780, "args": { "External id": 17779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774717.653, "dur": 1.960, "args": { "External id": 17780,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774719.006, "dur": 0.487, "args": { "External id": 17781,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650774720.761, "dur": 48.358, "args": { "External id": 17782,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774770.215, "dur": 5.683, "args": { "External id": 17783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774770.815, "dur": 4.518, "args": { "External id": 17784,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774774.283, "dur": 0.929, "args": { "External id": 17785,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774776.812, "dur": 4.424, "args": { "External id": 17786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774777.436, "dur": 3.356, "args": { "External id": 17787,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774778.972, "dur": 1.719, "args": { "External id": 17788,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650774781.755, "dur": 75.088, "args": { "External id": 17789,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 380 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774871.058, "dur": 33.825, "args": { "External id": 17790,"Record function id": 0, "Sequence number": 246728, "Fwd thread id": 1, "Ev Idx": 381 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774871.787, "dur": 4.170, "args": { "External id": 17791,"Sequence number": 246728, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 382 } }, { "ph": "f", "id": 40, "pid": 1336757, "tid": 1381170, "ts": 1295650774871.787, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650774873.431, "dur": 2.386, "args": { "External id": 17792,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650774874.651, "dur": 1.072, "args": { "External id": 17793,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650774879.034, "dur": 23.490, "args": { "External id": 17794,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 385 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774911.052, "dur": 8.082, "args": { "External id": 17795,"Record function id": 0, "Sequence number": 246727, "Fwd thread id": 1, "Ev Idx": 386 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650774912.108, "dur": 4.694, "args": { "External id": 17796,"Sequence number": 246727, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 387 } }, { "ph": "f", "id": 41, "pid": 1336757, "tid": 1381170, "ts": 1295650774912.108, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650774912.997, "dur": 3.596, "args": { "External id": 17797,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650774913.837, "dur": 2.225, "args": { "External id": 17798,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650774915.617, "dur": 0.316, "args": { "External id": 17799,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 390 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650774923.013, "dur": 4.854, "args": { "External id": 17800,"Record function id": 0, "Ev Idx": 391 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650774924.779, "dur": 2.646, "args": { "External id": 17801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650774925.500, "dur": 1.627, "args": { "External id": 17802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 393 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650774926.273, "dur": 0.748, "args": { "External id": 17803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 394 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650774932.692, "dur": 501.519, "args": { "External id": 17804,"Record function id": 0, "Sequence number": 246726, "Fwd thread id": 1, "Ev Idx": 395 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650774934.902, "dur": 485.427, "args": { "External id": 17805,"Sequence number": 246726, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 396 } }, { "ph": "f", "id": 42, "pid": 1336757, "tid": 1381170, "ts": 1295650774934.902, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1381170, "ts": 1295650774958.258, "dur": 87.510, "args": { "External id": 17806,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650774959.716, "dur": 85.719, "args": { "External id": 17807,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650774962.547, "dur": 8.617, "args": { "External id": 17808,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650774967.856, "dur": 2.719, "args": { "External id": 17809,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650774972.678, "dur": 71.692, "args": { "External id": 17810,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650775059.219, "dur": 3.254, "args": { "External id": 17811,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775060.573, "dur": 1.794, "args": { "External id": 17812,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650775066.100, "dur": 6.214, "args": { "External id": 17813,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775069.379, "dur": 2.804, "args": { "External id": 17814,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650775085.151, "dur": 3.056, "args": { "External id": 17815,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650775099.575, "dur": 3.800, "args": { "External id": 17816,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775299.653, "dur": 3.582, "args": { "External id": 17817,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650775307.909, "dur": 39.024, "args": { "External id": 17818,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775321.063, "dur": 1.165, "args": { "External id": 17819,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650775353.027, "dur": 33.061, "args": { "External id": 17820,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650775355.430, "dur": 30.441, "args": { "External id": 17821,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775361.995, "dur": 4.240, "args": { "External id": 17822,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650775367.541, "dur": 17.881, "args": { "External id": 17823,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650775390.667, "dur": 2.990, "args": { "External id": 17824,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775392.451, "dur": 1.060, "args": { "External id": 17825,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650775400.246, "dur": 2.467, "args": { "External id": 17826,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775401.248, "dur": 1.305, "args": { "External id": 17827,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650775406.988, "dur": 3.865, "args": { "External id": 17828,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775408.591, "dur": 2.170, "args": { "External id": 17829,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 420 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650775448.913, "dur": 10.168, "args": { "External id": 17830,"Record function id": 0, "Ev Idx": 421 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650775451.528, "dur": 6.817, "args": { "External id": 17831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650775453.932, "dur": 3.492, "args": { "External id": 17832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 423 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650775455.133, "dur": 2.184, "args": { "External id": 17833,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 424 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775463.602, "dur": 10.567, "args": { "External id": 17834,"Record function id": 0, "Sequence number": 246725, "Fwd thread id": 1, "Ev Idx": 425 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775464.955, "dur": 6.558, "args": { "External id": 17835,"Sequence number": 246725, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 426 } }, { "ph": "f", "id": 43, "pid": 1336757, "tid": 1381170, "ts": 1295650775464.955, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650775468.892, "dur": 2.399, "args": { "External id": 17836,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775469.944, "dur": 1.210, "args": { "External id": 17837,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 428 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775478.093, "dur": 145.122, "args": { "External id": 17838,"Record function id": 0, "Sequence number": 246724, "Fwd thread id": 1, "Ev Idx": 429 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775479.115, "dur": 140.274, "args": { "External id": 17839,"Sequence number": 246724, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 430 } }, { "ph": "f", "id": 44, "pid": 1336757, "tid": 1381170, "ts": 1295650775479.115, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650775481.730, "dur": 7.482, "args": { "External id": 17840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650775483.383, "dur": 5.087, "args": { "External id": 17841,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775487.329, "dur": 0.933, "args": { "External id": 17842,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650775490.420, "dur": 62.039, "args": { "External id": 17843,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650775553.546, "dur": 5.978, "args": { "External id": 17844,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650775554.401, "dur": 4.273, "args": { "External id": 17845,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775556.545, "dur": 1.948, "args": { "External id": 17846,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650775561.089, "dur": 5.592, "args": { "External id": 17847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650775561.805, "dur": 4.407, "args": { "External id": 17848,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775565.693, "dur": 0.448, "args": { "External id": 17849,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650775567.105, "dur": 51.311, "args": { "External id": 17850,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 441 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775627.664, "dur": 9.878, "args": { "External id": 17851,"Record function id": 0, "Sequence number": 246723, "Fwd thread id": 1, "Ev Idx": 442 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775628.665, "dur": 6.430, "args": { "External id": 17852,"Sequence number": 246723, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 443 } }, { "ph": "f", "id": 45, "pid": 1336757, "tid": 1381170, "ts": 1295650775628.665, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650775630.514, "dur": 4.443, "args": { "External id": 17853,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775631.943, "dur": 2.829, "args": { "External id": 17854,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 445 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775641.160, "dur": 9.737, "args": { "External id": 17855,"Record function id": 0, "Sequence number": 246722, "Fwd thread id": 1, "Ev Idx": 446 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775641.919, "dur": 6.782, "args": { "External id": 17856,"Sequence number": 246722, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 447 } }, { "ph": "f", "id": 46, "pid": 1336757, "tid": 1381170, "ts": 1295650775641.919, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650775642.822, "dur": 5.671, "args": { "External id": 17857,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650775643.757, "dur": 4.235, "args": { "External id": 17858,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775647.528, "dur": 0.363, "args": { "External id": 17859,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 450 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650775655.108, "dur": 5.312, "args": { "External id": 17860,"Record function id": 0, "Ev Idx": 451 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650775656.619, "dur": 3.298, "args": { "External id": 17861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650775657.827, "dur": 1.794, "args": { "External id": 17862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 453 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650775658.485, "dur": 1.070, "args": { "External id": 17863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 454 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775663.436, "dur": 6.509, "args": { "External id": 17864,"Record function id": 0, "Sequence number": 246721, "Fwd thread id": 1, "Ev Idx": 455 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650775664.224, "dur": 3.629, "args": { "External id": 17865,"Sequence number": 246721, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 456 } }, { "ph": "f", "id": 47, "pid": 1336757, "tid": 1381170, "ts": 1295650775664.224, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650775665.358, "dur": 2.342, "args": { "External id": 17866,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650775666.223, "dur": 1.328, "args": { "External id": 17867,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 458 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650775674.655, "dur": 298.401, "args": { "External id": 17868,"Record function id": 0, "Sequence number": 246720, "Fwd thread id": 1, "Ev Idx": 459 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650775676.630, "dur": 279.172, "args": { "External id": 17869,"Sequence number": 246720, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 460 } }, { "ph": "f", "id": 48, "pid": 1336757, "tid": 1381170, "ts": 1295650775676.630, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650775691.930, "dur": 6.506, "args": { "External id": 17870,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775694.849, "dur": 3.140, "args": { "External id": 17871,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650775700.864, "dur": 3.821, "args": { "External id": 17872,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775702.796, "dur": 1.681, "args": { "External id": 17873,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650775706.159, "dur": 5.589, "args": { "External id": 17874,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650775708.185, "dur": 3.349, "args": { "External id": 17875,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 466 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650775740.768, "dur": 191.223, "args": { "External id": 17876,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650775825.491, "dur": 3.299, "args": { "External id": 17877,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650775830.550, "dur": 3.407, "args": { "External id": 17878,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650775943.531, "dur": 3.342, "args": { "External id": 17879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650775949.866, "dur": 0.804, "args": { "External id": 17880,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650775952.519, "dur": 0.724, "args": { "External id": 17881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 472 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650775980.104, "dur": 292.591, "args": { "External id": 17882,"Record function id": 0, "Sequence number": 246719, "Fwd thread id": 1, "Ev Idx": 473 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650775981.863, "dur": 281.131, "args": { "External id": 17883,"Sequence number": 246719, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 474 } }, { "ph": "f", "id": 49, "pid": 1336757, "tid": 1381170, "ts": 1295650775981.863, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650776043.518, "dur": 50.524, "args": { "External id": 17884,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776047.593, "dur": 4.115, "args": { "External id": 17885,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650776053.104, "dur": 40.405, "args": { "External id": 17886,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650776103.788, "dur": 4.853, "args": { "External id": 17887,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776106.048, "dur": 2.276, "args": { "External id": 17888,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 479 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650776283.692, "dur": 161.982, "args": { "External id": 17889,"Record function id": 0, "Sequence number": 246718, "Fwd thread id": 1, "Ev Idx": 480 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650776286.338, "dur": 153.406, "args": { "External id": 17890,"Sequence number": 246718, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 481 } }, { "ph": "f", "id": 50, "pid": 1336757, "tid": 1381170, "ts": 1295650776286.338, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650776299.757, "dur": 34.042, "args": { "External id": 17891,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776302.784, "dur": 3.258, "args": { "External id": 17892,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650776307.178, "dur": 26.150, "args": { "External id": 17893,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650776341.330, "dur": 5.526, "args": { "External id": 17894,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776343.787, "dur": 2.653, "args": { "External id": 17895,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776451.682, "dur": 14.557, "args": { "External id": 17896,"Record function id": 0, "Sequence number": 246717, "Fwd thread id": 1, "Ev Idx": 487 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776452.943, "dur": 10.487, "args": { "External id": 17897,"Sequence number": 246717, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 488 } }, { "ph": "f", "id": 51, "pid": 1336757, "tid": 1381170, "ts": 1295650776452.943, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776455.795, "dur": 7.382, "args": { "External id": 17898,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776457.315, "dur": 5.570, "args": { "External id": 17899,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 490 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776469.823, "dur": 9.253, "args": { "External id": 17900,"Record function id": 0, "Sequence number": 246716, "Fwd thread id": 1, "Ev Idx": 491 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776470.816, "dur": 6.471, "args": { "External id": 17901,"Sequence number": 246716, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 492 } }, { "ph": "f", "id": 52, "pid": 1336757, "tid": 1381170, "ts": 1295650776470.816, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776472.567, "dur": 4.579, "args": { "External id": 17902,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776476.027, "dur": 1.020, "args": { "External id": 17903,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 494 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776482.255, "dur": 6.767, "args": { "External id": 17904,"Record function id": 0, "Sequence number": 246715, "Fwd thread id": 1, "Ev Idx": 495 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776483.182, "dur": 3.975, "args": { "External id": 17905,"Sequence number": 246715, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 496 } }, { "ph": "f", "id": 53, "pid": 1336757, "tid": 1381170, "ts": 1295650776483.182, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776484.746, "dur": 2.267, "args": { "External id": 17906,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776485.914, "dur": 0.977, "args": { "External id": 17907,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 498 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776492.460, "dur": 6.479, "args": { "External id": 17908,"Record function id": 0, "Sequence number": 246714, "Fwd thread id": 1, "Ev Idx": 499 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776493.731, "dur": 3.191, "args": { "External id": 17909,"Sequence number": 246714, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 500 } }, { "ph": "f", "id": 54, "pid": 1336757, "tid": 1381170, "ts": 1295650776493.731, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776495.033, "dur": 1.750, "args": { "External id": 17910,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776495.901, "dur": 0.748, "args": { "External id": 17911,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 502 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776502.191, "dur": 177.187, "args": { "External id": 17912,"Record function id": 0, "Sequence number": 246713, "Fwd thread id": 1, "Ev Idx": 503 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776505.417, "dur": 167.345, "args": { "External id": 17913,"Sequence number": 246713, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 504 } }, { "ph": "f", "id": 55, "pid": 1336757, "tid": 1381170, "ts": 1295650776505.417, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776509.225, "dur": 7.083, "args": { "External id": 17914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776511.265, "dur": 4.428, "args": { "External id": 17915,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776513.858, "dur": 1.553, "args": { "External id": 17916,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650776518.030, "dur": 69.367, "args": { "External id": 17917,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776588.694, "dur": 6.354, "args": { "External id": 17918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776589.441, "dur": 5.002, "args": { "External id": 17919,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776593.219, "dur": 1.061, "args": { "External id": 17920,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776622.676, "dur": 2.892, "args": { "External id": 17921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776623.416, "dur": 1.635, "args": { "External id": 17922,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776624.587, "dur": 0.399, "args": { "External id": 17923,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650776626.281, "dur": 45.544, "args": { "External id": 17924,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 515 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776684.241, "dur": 8.328, "args": { "External id": 17925,"Record function id": 0, "Sequence number": 246712, "Fwd thread id": 1, "Ev Idx": 516 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776684.999, "dur": 5.704, "args": { "External id": 17926,"Sequence number": 246712, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 517 } }, { "ph": "f", "id": 56, "pid": 1336757, "tid": 1381170, "ts": 1295650776684.999, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776686.555, "dur": 4.001, "args": { "External id": 17927,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776689.312, "dur": 1.129, "args": { "External id": 17928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 519 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776695.825, "dur": 7.727, "args": { "External id": 17929,"Record function id": 0, "Sequence number": 246711, "Fwd thread id": 1, "Ev Idx": 520 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776697.174, "dur": 4.658, "args": { "External id": 17930,"Sequence number": 246711, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 521 } }, { "ph": "f", "id": 57, "pid": 1336757, "tid": 1381170, "ts": 1295650776697.174, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776697.785, "dur": 3.829, "args": { "External id": 17931,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776698.454, "dur": 2.660, "args": { "External id": 17932,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776700.509, "dur": 0.499, "args": { "External id": 17933,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 524 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650776709.819, "dur": 11.716, "args": { "External id": 17934,"Record function id": 0, "Ev Idx": 525 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650776711.667, "dur": 9.113, "args": { "External id": 17935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650776714.158, "dur": 6.287, "args": { "External id": 17936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 527 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650776717.593, "dur": 2.731, "args": { "External id": 17937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 528 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776727.346, "dur": 6.917, "args": { "External id": 17938,"Record function id": 0, "Sequence number": 246710, "Fwd thread id": 1, "Ev Idx": 529 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776728.932, "dur": 3.034, "args": { "External id": 17939,"Sequence number": 246710, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 530 } }, { "ph": "f", "id": 58, "pid": 1336757, "tid": 1381170, "ts": 1295650776728.932, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776729.974, "dur": 1.837, "args": { "External id": 17940,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776730.849, "dur": 0.842, "args": { "External id": 17941,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 532 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776737.486, "dur": 90.366, "args": { "External id": 17942,"Record function id": 0, "Sequence number": 246709, "Fwd thread id": 1, "Ev Idx": 533 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776738.150, "dur": 83.952, "args": { "External id": 17943,"Sequence number": 246709, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 534 } }, { "ph": "f", "id": 59, "pid": 1336757, "tid": 1381170, "ts": 1295650776738.150, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776740.557, "dur": 5.204, "args": { "External id": 17944,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776741.149, "dur": 4.147, "args": { "External id": 17945,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776744.809, "dur": 0.378, "args": { "External id": 17946,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650776746.373, "dur": 28.306, "args": { "External id": 17947,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776775.727, "dur": 4.096, "args": { "External id": 17948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776776.394, "dur": 2.799, "args": { "External id": 17949,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776778.140, "dur": 0.930, "args": { "External id": 17950,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776780.795, "dur": 6.743, "args": { "External id": 17951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776783.864, "dur": 3.185, "args": { "External id": 17952,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776785.123, "dur": 1.853, "args": { "External id": 17953,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650776787.962, "dur": 33.449, "args": { "External id": 17954,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 545 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776832.235, "dur": 31.066, "args": { "External id": 17955,"Record function id": 0, "Sequence number": 246708, "Fwd thread id": 1, "Ev Idx": 546 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776833.060, "dur": 3.706, "args": { "External id": 17956,"Sequence number": 246708, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 547 } }, { "ph": "f", "id": 60, "pid": 1336757, "tid": 1381170, "ts": 1295650776833.060, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776834.682, "dur": 1.926, "args": { "External id": 17957,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776835.587, "dur": 0.886, "args": { "External id": 17958,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650776839.795, "dur": 21.256, "args": { "External id": 17959,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 550 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776867.207, "dur": 9.911, "args": { "External id": 17960,"Record function id": 0, "Sequence number": 246707, "Fwd thread id": 1, "Ev Idx": 551 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776868.002, "dur": 7.475, "args": { "External id": 17961,"Sequence number": 246707, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 552 } }, { "ph": "f", "id": 61, "pid": 1336757, "tid": 1381170, "ts": 1295650776868.002, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776871.332, "dur": 3.945, "args": { "External id": 17962,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776872.075, "dur": 2.652, "args": { "External id": 17963,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776874.079, "dur": 0.509, "args": { "External id": 17964,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 555 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650776881.102, "dur": 4.969, "args": { "External id": 17965,"Record function id": 0, "Ev Idx": 556 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650776882.866, "dur": 2.680, "args": { "External id": 17966,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650776883.609, "dur": 1.631, "args": { "External id": 17967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 558 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650776884.207, "dur": 0.933, "args": { "External id": 17968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 559 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776889.557, "dur": 9.149, "args": { "External id": 17969,"Record function id": 0, "Sequence number": 246706, "Fwd thread id": 1, "Ev Idx": 560 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776890.817, "dur": 5.658, "args": { "External id": 17970,"Sequence number": 246706, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 561 } }, { "ph": "f", "id": 62, "pid": 1336757, "tid": 1381170, "ts": 1295650776890.817, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650776891.968, "dur": 4.355, "args": { "External id": 17971,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650776895.438, "dur": 0.794, "args": { "External id": 17972,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 563 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776902.183, "dur": 127.647, "args": { "External id": 17973,"Record function id": 0, "Sequence number": 246705, "Fwd thread id": 1, "Ev Idx": 564 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650776902.839, "dur": 80.719, "args": { "External id": 17974,"Sequence number": 246705, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 565 } }, { "ph": "f", "id": 63, "pid": 1336757, "tid": 1381170, "ts": 1295650776902.839, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776904.936, "dur": 3.420, "args": { "External id": 17975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776905.389, "dur": 2.466, "args": { "External id": 17976,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776907.242, "dur": 0.503, "args": { "External id": 17977,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650776909.186, "dur": 28.191, "args": { "External id": 17978,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776940.459, "dur": 3.667, "args": { "External id": 17979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776940.914, "dur": 2.569, "args": { "External id": 17980,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776942.847, "dur": 0.519, "args": { "External id": 17981,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650776945.172, "dur": 2.721, "args": { "External id": 17982,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650776945.609, "dur": 1.858, "args": { "External id": 17983,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650776947.087, "dur": 0.265, "args": { "External id": 17984,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650776950.587, "dur": 32.325, "args": { "External id": 17985,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 576 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777037.144, "dur": 30.420, "args": { "External id": 17986,"Record function id": 0, "Sequence number": 246704, "Fwd thread id": 1, "Ev Idx": 577 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777038.437, "dur": 4.735, "args": { "External id": 17987,"Sequence number": 246704, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 578 } }, { "ph": "f", "id": 64, "pid": 1336757, "tid": 1381170, "ts": 1295650777038.437, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777040.349, "dur": 2.632, "args": { "External id": 17988,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777041.189, "dur": 1.656, "args": { "External id": 17989,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650777045.715, "dur": 19.862, "args": { "External id": 17990,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 581 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777071.274, "dur": 12.026, "args": { "External id": 17991,"Record function id": 0, "Sequence number": 246703, "Fwd thread id": 1, "Ev Idx": 582 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777072.189, "dur": 9.367, "args": { "External id": 17992,"Sequence number": 246703, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 583 } }, { "ph": "f", "id": 65, "pid": 1336757, "tid": 1381170, "ts": 1295650777072.189, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650777072.878, "dur": 8.415, "args": { "External id": 17993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650777076.427, "dur": 4.213, "args": { "External id": 17994,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777079.958, "dur": 0.524, "args": { "External id": 17995,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 586 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650777087.713, "dur": 5.401, "args": { "External id": 17996,"Record function id": 0, "Ev Idx": 587 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650777089.115, "dur": 3.539, "args": { "External id": 17997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650777090.219, "dur": 2.102, "args": { "External id": 17998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 589 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650777090.890, "dur": 1.323, "args": { "External id": 17999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 590 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650777097.545, "dur": 377.886, "args": { "External id": 18000,"Record function id": 0, "Sequence number": 246702, "Fwd thread id": 1, "Ev Idx": 591 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650777099.130, "dur": 342.511, "args": { "External id": 18001,"Sequence number": 246702, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 592 } }, { "ph": "f", "id": 66, "pid": 1336757, "tid": 1381170, "ts": 1295650777099.130, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777131.026, "dur": 1.851, "args": { "External id": 18002,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777131.763, "dur": 0.965, "args": { "External id": 18003,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650777148.874, "dur": 5.581, "args": { "External id": 18004,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650777163.970, "dur": 1.967, "args": { "External id": 18005,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777334.210, "dur": 2.961, "args": { "External id": 18006,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650777341.596, "dur": 37.872, "args": { "External id": 18007,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777352.703, "dur": 1.075, "args": { "External id": 18008,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650777385.367, "dur": 31.861, "args": { "External id": 18009,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650777387.420, "dur": 29.599, "args": { "External id": 18010,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777391.564, "dur": 5.067, "args": { "External id": 18011,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650777398.552, "dur": 17.956, "args": { "External id": 18012,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650777424.137, "dur": 2.518, "args": { "External id": 18013,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777425.451, "dur": 1.105, "args": { "External id": 18014,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777432.920, "dur": 2.040, "args": { "External id": 18015,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777434.059, "dur": 0.814, "args": { "External id": 18016,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650777452.024, "dur": 18.025, "args": { "External id": 18017,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 608 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650777487.327, "dur": 12.296, "args": { "External id": 18018,"Record function id": 0, "Ev Idx": 609 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650777489.917, "dur": 9.026, "args": { "External id": 18019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650777492.510, "dur": 5.539, "args": { "External id": 18020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 611 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650777496.277, "dur": 1.666, "args": { "External id": 18021,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 612 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777505.954, "dur": 6.047, "args": { "External id": 18022,"Record function id": 0, "Sequence number": 246701, "Fwd thread id": 1, "Ev Idx": 613 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777507.159, "dur": 1.152, "args": { "External id": 18023,"Sequence number": 246701, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 614 } }, { "ph": "f", "id": 67, "pid": 1336757, "tid": 1381170, "ts": 1295650777507.159, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650777515.922, "dur": 398.027, "args": { "External id": 18024,"Record function id": 0, "Sequence number": 246700, "Fwd thread id": 1, "Ev Idx": 615 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650777517.470, "dur": 386.273, "args": { "External id": 18025,"Sequence number": 246700, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 616 } }, { "ph": "f", "id": 68, "pid": 1336757, "tid": 1381170, "ts": 1295650777517.470, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777544.802, "dur": 8.810, "args": { "External id": 18026,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650777550.207, "dur": 3.124, "args": { "External id": 18027,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650777556.623, "dur": 7.732, "args": { "External id": 18028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650777558.467, "dur": 5.318, "args": { "External id": 18029,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777562.909, "dur": 0.710, "args": { "External id": 18030,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1381170, "ts": 1295650777567.982, "dur": 90.545, "args": { "External id": 18031,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650777568.861, "dur": 4.816, "args": { "External id": 18032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650777569.759, "dur": 3.446, "args": { "External id": 18033,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777571.284, "dur": 1.817, "args": { "External id": 18034,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1381170, "ts": 1295650777575.145, "dur": 82.902, "args": { "External id": 18035,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650777578.174, "dur": 79.197, "args": { "External id": 18036,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650777662.453, "dur": 3.049, "args": { "External id": 18037,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777664.038, "dur": 1.367, "args": { "External id": 18038,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650777696.693, "dur": 4.374, "args": { "External id": 18039,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650777702.513, "dur": 1.760, "args": { "External id": 18040,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650777705.289, "dur": 1.677, "args": { "External id": 18041,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777742.397, "dur": 2.513, "args": { "External id": 18042,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777743.413, "dur": 1.324, "args": { "External id": 18043,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336757, "tid": 1381170, "ts": 1295650777765.048, "dur": 123.185, "args": { "External id": 18044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650777770.650, "dur": 5.844, "args": { "External id": 18045,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777774.869, "dur": 0.785, "args": { "External id": 18046,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650777778.240, "dur": 7.383, "args": { "External id": 18047,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777782.732, "dur": 2.149, "args": { "External id": 18048,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650777787.008, "dur": 3.068, "args": { "External id": 18049,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777789.190, "dur": 0.509, "args": { "External id": 18050,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650777791.321, "dur": 3.323, "args": { "External id": 18051,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777793.545, "dur": 0.595, "args": { "External id": 18052,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650777800.449, "dur": 3.336, "args": { "External id": 18053,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777802.956, "dur": 0.508, "args": { "External id": 18054,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777805.008, "dur": 5.522, "args": { "External id": 18055,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650777808.788, "dur": 1.541, "args": { "External id": 18056,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650777811.778, "dur": 2.681, "args": { "External id": 18057,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777813.825, "dur": 0.344, "args": { "External id": 18058,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777815.425, "dur": 3.473, "args": { "External id": 18059,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777816.625, "dur": 2.173, "args": { "External id": 18060,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295650777820.484, "dur": 51.591, "args": { "External id": 18061,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777876.534, "dur": 2.445, "args": { "External id": 18062,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650777879.979, "dur": 3.849, "args": { "External id": 18063,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777882.909, "dur": 0.430, "args": { "External id": 18064,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777886.162, "dur": 0.725, "args": { "External id": 18065,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 656 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650777922.663, "dur": 8.299, "args": { "External id": 18066,"Record function id": 0, "Ev Idx": 657 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650777924.978, "dur": 5.359, "args": { "External id": 18067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650777926.883, "dur": 2.658, "args": { "External id": 18068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 659 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650777927.723, "dur": 1.689, "args": { "External id": 18069,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 660 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777934.958, "dur": 9.582, "args": { "External id": 18070,"Record function id": 0, "Sequence number": 246699, "Fwd thread id": 1, "Ev Idx": 661 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777936.281, "dur": 5.785, "args": { "External id": 18071,"Sequence number": 246699, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 662 } }, { "ph": "f", "id": 69, "pid": 1336757, "tid": 1381170, "ts": 1295650777936.281, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650777937.722, "dur": 4.182, "args": { "External id": 18072,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650777941.042, "dur": 0.721, "args": { "External id": 18073,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 664 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777948.096, "dur": 174.107, "args": { "External id": 18074,"Record function id": 0, "Sequence number": 246698, "Fwd thread id": 1, "Ev Idx": 665 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650777949.076, "dur": 165.771, "args": { "External id": 18075,"Sequence number": 246698, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 666 } }, { "ph": "f", "id": 70, "pid": 1336757, "tid": 1381170, "ts": 1295650777949.076, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650777951.863, "dur": 4.143, "args": { "External id": 18076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650777953.009, "dur": 2.487, "args": { "External id": 18077,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650777954.634, "dur": 0.700, "args": { "External id": 18078,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650777957.143, "dur": 82.662, "args": { "External id": 18079,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778044.882, "dur": 5.566, "args": { "External id": 18080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778046.010, "dur": 3.558, "args": { "External id": 18081,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778048.324, "dur": 1.069, "args": { "External id": 18082,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778052.195, "dur": 3.510, "args": { "External id": 18083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778053.151, "dur": 1.908, "args": { "External id": 18084,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778054.615, "dur": 0.382, "args": { "External id": 18085,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650778058.722, "dur": 55.283, "args": { "External id": 18086,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 677 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778129.159, "dur": 7.224, "args": { "External id": 18087,"Record function id": 0, "Sequence number": 246697, "Fwd thread id": 1, "Ev Idx": 678 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778130.421, "dur": 4.630, "args": { "External id": 18088,"Sequence number": 246697, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 679 } }, { "ph": "f", "id": 71, "pid": 1336757, "tid": 1381170, "ts": 1295650778130.421, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778132.281, "dur": 2.606, "args": { "External id": 18089,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778133.494, "dur": 1.299, "args": { "External id": 18090,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 681 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778139.827, "dur": 7.781, "args": { "External id": 18091,"Record function id": 0, "Sequence number": 246696, "Fwd thread id": 1, "Ev Idx": 682 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778140.820, "dur": 4.770, "args": { "External id": 18092,"Sequence number": 246696, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 683 } }, { "ph": "f", "id": 72, "pid": 1336757, "tid": 1381170, "ts": 1295650778140.820, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778141.647, "dur": 3.699, "args": { "External id": 18093,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778142.448, "dur": 2.407, "args": { "External id": 18094,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778144.247, "dur": 0.518, "args": { "External id": 18095,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 686 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778152.259, "dur": 8.641, "args": { "External id": 18096,"Record function id": 0, "Ev Idx": 687 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778154.024, "dur": 6.314, "args": { "External id": 18097,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778155.141, "dur": 4.866, "args": { "External id": 18098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 689 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778157.983, "dur": 1.890, "args": { "External id": 18099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 690 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778164.723, "dur": 6.884, "args": { "External id": 18100,"Record function id": 0, "Sequence number": 246695, "Fwd thread id": 1, "Ev Idx": 691 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778166.346, "dur": 3.397, "args": { "External id": 18101,"Sequence number": 246695, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 692 } }, { "ph": "f", "id": 73, "pid": 1336757, "tid": 1381170, "ts": 1295650778166.346, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778167.562, "dur": 2.037, "args": { "External id": 18102,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778168.785, "dur": 0.665, "args": { "External id": 18103,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 694 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778174.574, "dur": 139.735, "args": { "External id": 18104,"Record function id": 0, "Sequence number": 246694, "Fwd thread id": 1, "Ev Idx": 695 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778175.231, "dur": 130.115, "args": { "External id": 18105,"Sequence number": 246694, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 696 } }, { "ph": "f", "id": 74, "pid": 1336757, "tid": 1381170, "ts": 1295650778175.231, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778177.407, "dur": 9.231, "args": { "External id": 18106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778180.014, "dur": 6.116, "args": { "External id": 18107,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778185.463, "dur": 0.539, "args": { "External id": 18108,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650778187.274, "dur": 35.913, "args": { "External id": 18109,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778224.320, "dur": 19.403, "args": { "External id": 18110,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778225.305, "dur": 17.423, "args": { "External id": 18111,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778226.989, "dur": 15.202, "args": { "External id": 18112,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778247.753, "dur": 5.623, "args": { "External id": 18113,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778248.614, "dur": 4.158, "args": { "External id": 18114,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778250.806, "dur": 1.896, "args": { "External id": 18115,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650778254.107, "dur": 50.437, "args": { "External id": 18116,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 707 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778320.001, "dur": 30.874, "args": { "External id": 18117,"Record function id": 0, "Sequence number": 246693, "Fwd thread id": 1, "Ev Idx": 708 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778321.068, "dur": 4.201, "args": { "External id": 18118,"Sequence number": 246693, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 709 } }, { "ph": "f", "id": 75, "pid": 1336757, "tid": 1381170, "ts": 1295650778321.068, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778322.958, "dur": 2.148, "args": { "External id": 18119,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778323.897, "dur": 1.116, "args": { "External id": 18120,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650778327.862, "dur": 20.571, "args": { "External id": 18121,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 712 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778354.531, "dur": 10.010, "args": { "External id": 18122,"Record function id": 0, "Sequence number": 246692, "Fwd thread id": 1, "Ev Idx": 713 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778357.873, "dur": 4.414, "args": { "External id": 18123,"Sequence number": 246692, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 714 } }, { "ph": "f", "id": 76, "pid": 1336757, "tid": 1381170, "ts": 1295650778357.873, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778358.564, "dur": 3.522, "args": { "External id": 18124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778359.162, "dur": 2.375, "args": { "External id": 18125,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778360.809, "dur": 0.617, "args": { "External id": 18126,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 717 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778368.854, "dur": 6.280, "args": { "External id": 18127,"Record function id": 0, "Ev Idx": 718 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778370.855, "dur": 3.759, "args": { "External id": 18128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778371.964, "dur": 2.365, "args": { "External id": 18129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 720 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778372.713, "dur": 1.528, "args": { "External id": 18130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650778381.416, "dur": 404.618, "args": { "External id": 18131,"Record function id": 0, "Sequence number": 246691, "Fwd thread id": 1, "Ev Idx": 722 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650778382.940, "dur": 372.870, "args": { "External id": 18132,"Sequence number": 246691, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 723 } }, { "ph": "f", "id": 77, "pid": 1336757, "tid": 1381170, "ts": 1295650778382.940, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1381170, "ts": 1295650778406.025, "dur": 33.565, "args": { "External id": 18133,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650778407.541, "dur": 31.822, "args": { "External id": 18134,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650778410.319, "dur": 6.031, "args": { "External id": 18135,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650778412.775, "dur": 3.100, "args": { "External id": 18136,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650778417.712, "dur": 21.084, "args": { "External id": 18137,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778451.855, "dur": 2.681, "args": { "External id": 18138,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778452.990, "dur": 1.414, "args": { "External id": 18139,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778457.806, "dur": 4.284, "args": { "External id": 18140,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778458.872, "dur": 3.141, "args": { "External id": 18141,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650778475.654, "dur": 2.429, "args": { "External id": 18142,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650778488.936, "dur": 1.692, "args": { "External id": 18143,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778650.758, "dur": 2.457, "args": { "External id": 18144,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650778657.437, "dur": 31.519, "args": { "External id": 18145,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778666.237, "dur": 0.943, "args": { "External id": 18146,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650778694.121, "dur": 29.659, "args": { "External id": 18147,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650778695.930, "dur": 27.649, "args": { "External id": 18148,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778699.635, "dur": 4.046, "args": { "External id": 18149,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650778706.978, "dur": 16.035, "args": { "External id": 18150,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650778728.006, "dur": 2.462, "args": { "External id": 18151,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778729.382, "dur": 0.935, "args": { "External id": 18152,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778736.581, "dur": 2.798, "args": { "External id": 18153,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778737.887, "dur": 1.381, "args": { "External id": 18154,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778741.775, "dur": 3.929, "args": { "External id": 18155,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778743.121, "dur": 2.491, "args": { "External id": 18156,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650778768.297, "dur": 16.111, "args": { "External id": 18157,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 748 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778795.843, "dur": 8.986, "args": { "External id": 18158,"Record function id": 0, "Ev Idx": 749 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778798.386, "dur": 5.773, "args": { "External id": 18159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778800.385, "dur": 2.964, "args": { "External id": 18160,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 751 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778801.332, "dur": 1.909, "args": { "External id": 18161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 752 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778808.862, "dur": 8.461, "args": { "External id": 18162,"Record function id": 0, "Sequence number": 246690, "Fwd thread id": 1, "Ev Idx": 753 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778810.543, "dur": 4.295, "args": { "External id": 18163,"Sequence number": 246690, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 754 } }, { "ph": "f", "id": 78, "pid": 1336757, "tid": 1381170, "ts": 1295650778810.543, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778812.062, "dur": 2.607, "args": { "External id": 18164,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778813.289, "dur": 1.199, "args": { "External id": 18165,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 756 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778823.048, "dur": 115.927, "args": { "External id": 18166,"Record function id": 0, "Sequence number": 246689, "Fwd thread id": 1, "Ev Idx": 757 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778824.195, "dur": 109.622, "args": { "External id": 18167,"Sequence number": 246689, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 758 } }, { "ph": "f", "id": 79, "pid": 1336757, "tid": 1381170, "ts": 1295650778824.195, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778826.599, "dur": 4.493, "args": { "External id": 18168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778827.732, "dur": 2.840, "args": { "External id": 18169,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778829.536, "dur": 0.890, "args": { "External id": 18170,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650778832.110, "dur": 48.799, "args": { "External id": 18171,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778882.076, "dur": 7.387, "args": { "External id": 18172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778885.309, "dur": 3.499, "args": { "External id": 18173,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778886.871, "dur": 1.767, "args": { "External id": 18174,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778890.876, "dur": 3.698, "args": { "External id": 18175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778891.675, "dur": 2.455, "args": { "External id": 18176,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778893.607, "dur": 0.447, "args": { "External id": 18177,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650778895.324, "dur": 37.658, "args": { "External id": 18178,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 769 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778943.876, "dur": 11.012, "args": { "External id": 18179,"Record function id": 0, "Sequence number": 246688, "Fwd thread id": 1, "Ev Idx": 770 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778946.900, "dur": 5.996, "args": { "External id": 18180,"Sequence number": 246688, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 771 } }, { "ph": "f", "id": 80, "pid": 1336757, "tid": 1381170, "ts": 1295650778946.900, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778948.634, "dur": 4.106, "args": { "External id": 18181,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778950.070, "dur": 2.526, "args": { "External id": 18182,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 773 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778958.577, "dur": 7.591, "args": { "External id": 18183,"Record function id": 0, "Sequence number": 246687, "Fwd thread id": 1, "Ev Idx": 774 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778959.466, "dur": 4.417, "args": { "External id": 18184,"Sequence number": 246687, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 775 } }, { "ph": "f", "id": 81, "pid": 1336757, "tid": 1381170, "ts": 1295650778959.466, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650778960.254, "dur": 3.413, "args": { "External id": 18185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650778960.758, "dur": 2.389, "args": { "External id": 18186,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650778962.453, "dur": 0.584, "args": { "External id": 18187,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 778 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778970.255, "dur": 7.229, "args": { "External id": 18188,"Record function id": 0, "Ev Idx": 779 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650778972.084, "dur": 4.897, "args": { "External id": 18189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778973.026, "dur": 3.694, "args": { "External id": 18190,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 781 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650778975.712, "dur": 0.934, "args": { "External id": 18191,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 782 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778980.497, "dur": 45.919, "args": { "External id": 18192,"Record function id": 0, "Sequence number": 246686, "Fwd thread id": 1, "Ev Idx": 783 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650778981.330, "dur": 41.738, "args": { "External id": 18193,"Sequence number": 246686, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 784 } }, { "ph": "f", "id": 82, "pid": 1336757, "tid": 1381170, "ts": 1295650778981.330, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650778982.491, "dur": 40.385, "args": { "External id": 18194,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650778983.277, "dur": 39.136, "args": { "External id": 18195,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 786 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650779033.256, "dur": 293.703, "args": { "External id": 18196,"Record function id": 0, "Sequence number": 246685, "Fwd thread id": 1, "Ev Idx": 787 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650779035.108, "dur": 274.189, "args": { "External id": 18197,"Sequence number": 246685, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 788 } }, { "ph": "f", "id": 83, "pid": 1336757, "tid": 1381170, "ts": 1295650779035.108, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650779050.045, "dur": 8.015, "args": { "External id": 18198,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779053.290, "dur": 4.318, "args": { "External id": 18199,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650779059.920, "dur": 4.043, "args": { "External id": 18200,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779061.972, "dur": 1.795, "args": { "External id": 18201,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650779065.356, "dur": 5.447, "args": { "External id": 18202,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779067.336, "dur": 3.276, "args": { "External id": 18203,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 794 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650779095.218, "dur": 187.228, "args": { "External id": 18204,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650779171.905, "dur": 3.231, "args": { "External id": 18205,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650779177.008, "dur": 3.732, "args": { "External id": 18206,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650779296.075, "dur": 4.080, "args": { "External id": 18207,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650779303.068, "dur": 0.791, "args": { "External id": 18208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650779306.040, "dur": 0.728, "args": { "External id": 18209,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 800 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650779335.776, "dur": 220.084, "args": { "External id": 18210,"Record function id": 0, "Sequence number": 246684, "Fwd thread id": 1, "Ev Idx": 801 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650779338.132, "dur": 211.843, "args": { "External id": 18211,"Sequence number": 246684, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 802 } }, { "ph": "f", "id": 84, "pid": 1336757, "tid": 1381170, "ts": 1295650779338.132, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650779357.130, "dur": 47.118, "args": { "External id": 18212,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779360.364, "dur": 3.282, "args": { "External id": 18213,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650779365.021, "dur": 38.757, "args": { "External id": 18214,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650779413.685, "dur": 4.253, "args": { "External id": 18215,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779415.481, "dur": 2.135, "args": { "External id": 18216,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 807 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650779562.530, "dur": 143.194, "args": { "External id": 18217,"Record function id": 0, "Sequence number": 246683, "Fwd thread id": 1, "Ev Idx": 808 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650779564.795, "dur": 135.983, "args": { "External id": 18218,"Sequence number": 246683, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 809 } }, { "ph": "f", "id": 85, "pid": 1336757, "tid": 1381170, "ts": 1295650779564.795, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650779575.682, "dur": 31.576, "args": { "External id": 18219,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779578.390, "dur": 2.167, "args": { "External id": 18220,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650779581.675, "dur": 25.120, "args": { "External id": 18221,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650779614.350, "dur": 4.283, "args": { "External id": 18222,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779616.216, "dur": 2.160, "args": { "External id": 18223,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 814 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779711.301, "dur": 17.062, "args": { "External id": 18224,"Record function id": 0, "Sequence number": 246682, "Fwd thread id": 1, "Ev Idx": 815 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779715.198, "dur": 10.745, "args": { "External id": 18225,"Sequence number": 246682, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 816 } }, { "ph": "f", "id": 86, "pid": 1336757, "tid": 1381170, "ts": 1295650779715.198, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650779717.989, "dur": 7.707, "args": { "External id": 18226,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650779719.914, "dur": 5.598, "args": { "External id": 18227,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 818 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779731.846, "dur": 6.015, "args": { "External id": 18228,"Record function id": 0, "Sequence number": 246681, "Fwd thread id": 1, "Ev Idx": 819 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779732.856, "dur": 3.518, "args": { "External id": 18229,"Sequence number": 246681, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 820 } }, { "ph": "f", "id": 87, "pid": 1336757, "tid": 1381170, "ts": 1295650779732.856, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650779734.083, "dur": 2.136, "args": { "External id": 18230,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650779735.268, "dur": 0.815, "args": { "External id": 18231,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 822 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779742.842, "dur": 8.554, "args": { "External id": 18232,"Record function id": 0, "Sequence number": 246680, "Fwd thread id": 1, "Ev Idx": 823 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779743.620, "dur": 5.910, "args": { "External id": 18233,"Sequence number": 246680, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 824 } }, { "ph": "f", "id": 88, "pid": 1336757, "tid": 1381170, "ts": 1295650779743.620, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650779745.126, "dur": 4.256, "args": { "External id": 18234,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650779748.435, "dur": 0.815, "args": { "External id": 18235,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 826 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779754.908, "dur": 6.245, "args": { "External id": 18236,"Record function id": 0, "Sequence number": 246679, "Fwd thread id": 1, "Ev Idx": 827 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779756.085, "dur": 3.018, "args": { "External id": 18237,"Sequence number": 246679, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 828 } }, { "ph": "f", "id": 89, "pid": 1336757, "tid": 1381170, "ts": 1295650779756.085, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650779757.071, "dur": 1.905, "args": { "External id": 18238,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650779757.798, "dur": 1.043, "args": { "External id": 18239,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 830 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779764.458, "dur": 142.270, "args": { "External id": 18240,"Record function id": 0, "Sequence number": 246678, "Fwd thread id": 1, "Ev Idx": 831 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779765.371, "dur": 134.621, "args": { "External id": 18241,"Sequence number": 246678, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 832 } }, { "ph": "f", "id": 90, "pid": 1336757, "tid": 1381170, "ts": 1295650779765.371, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650779768.610, "dur": 8.855, "args": { "External id": 18242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650779770.408, "dur": 6.486, "args": { "External id": 18243,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779775.244, "dur": 1.374, "args": { "External id": 18244,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650779778.814, "dur": 64.252, "args": { "External id": 18245,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650779844.393, "dur": 5.248, "args": { "External id": 18246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650779845.144, "dur": 3.727, "args": { "External id": 18247,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779847.435, "dur": 1.281, "args": { "External id": 18248,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650779851.055, "dur": 6.085, "args": { "External id": 18249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650779852.144, "dur": 4.530, "args": { "External id": 18250,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779856.250, "dur": 0.358, "args": { "External id": 18251,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650779857.756, "dur": 41.430, "args": { "External id": 18252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 843 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779911.394, "dur": 6.918, "args": { "External id": 18253,"Record function id": 0, "Sequence number": 246677, "Fwd thread id": 1, "Ev Idx": 844 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779912.302, "dur": 4.329, "args": { "External id": 18254,"Sequence number": 246677, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 845 } }, { "ph": "f", "id": 91, "pid": 1336757, "tid": 1381170, "ts": 1295650779912.302, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650779914.106, "dur": 2.386, "args": { "External id": 18255,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650779915.248, "dur": 1.145, "args": { "External id": 18256,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 847 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779921.818, "dur": 9.415, "args": { "External id": 18257,"Record function id": 0, "Sequence number": 246676, "Fwd thread id": 1, "Ev Idx": 848 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779922.479, "dur": 7.045, "args": { "External id": 18258,"Sequence number": 246676, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 849 } }, { "ph": "f", "id": 92, "pid": 1336757, "tid": 1381170, "ts": 1295650779922.479, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650779923.252, "dur": 6.051, "args": { "External id": 18259,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650779926.038, "dur": 2.741, "args": { "External id": 18260,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779928.056, "dur": 0.649, "args": { "External id": 18261,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 852 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650779937.270, "dur": 9.407, "args": { "External id": 18262,"Record function id": 0, "Ev Idx": 853 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650779938.985, "dur": 6.887, "args": { "External id": 18263,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650779941.341, "dur": 4.168, "args": { "External id": 18264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 855 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650779942.782, "dur": 2.629, "args": { "External id": 18265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 856 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779950.056, "dur": 6.676, "args": { "External id": 18266,"Record function id": 0, "Sequence number": 246675, "Fwd thread id": 1, "Ev Idx": 857 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779951.561, "dur": 2.964, "args": { "External id": 18267,"Sequence number": 246675, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 858 } }, { "ph": "f", "id": 93, "pid": 1336757, "tid": 1381170, "ts": 1295650779951.561, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650779952.761, "dur": 1.623, "args": { "External id": 18268,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650779953.478, "dur": 0.812, "args": { "External id": 18269,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 860 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779962.854, "dur": 137.039, "args": { "External id": 18270,"Record function id": 0, "Sequence number": 246674, "Fwd thread id": 1, "Ev Idx": 861 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650779963.816, "dur": 129.368, "args": { "External id": 18271,"Sequence number": 246674, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 862 } }, { "ph": "f", "id": 94, "pid": 1336757, "tid": 1381170, "ts": 1295650779963.816, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650779965.502, "dur": 2.734, "args": { "External id": 18272,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650779966.027, "dur": 1.749, "args": { "External id": 18273,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650779967.357, "dur": 0.302, "args": { "External id": 18274,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650779969.014, "dur": 67.516, "args": { "External id": 18275,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780039.025, "dur": 8.267, "args": { "External id": 18276,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780042.896, "dur": 3.571, "args": { "External id": 18277,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780045.013, "dur": 1.328, "args": { "External id": 18278,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780048.997, "dur": 5.747, "args": { "External id": 18279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780050.112, "dur": 4.144, "args": { "External id": 18280,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780051.660, "dur": 2.505, "args": { "External id": 18281,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650780055.211, "dur": 37.139, "args": { "External id": 18282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 873 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780106.476, "dur": 34.910, "args": { "External id": 18283,"Record function id": 0, "Sequence number": 246673, "Fwd thread id": 1, "Ev Idx": 874 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780109.535, "dur": 4.594, "args": { "External id": 18284,"Sequence number": 246673, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 875 } }, { "ph": "f", "id": 95, "pid": 1336757, "tid": 1381170, "ts": 1295650780109.535, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650780111.192, "dur": 2.775, "args": { "External id": 18285,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780112.510, "dur": 1.352, "args": { "External id": 18286,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650780117.020, "dur": 22.489, "args": { "External id": 18287,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 878 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780145.230, "dur": 9.921, "args": { "External id": 18288,"Record function id": 0, "Sequence number": 246672, "Fwd thread id": 1, "Ev Idx": 879 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780146.785, "dur": 5.943, "args": { "External id": 18289,"Sequence number": 246672, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 880 } }, { "ph": "f", "id": 96, "pid": 1336757, "tid": 1381170, "ts": 1295650780146.785, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780147.377, "dur": 5.141, "args": { "External id": 18290,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780148.440, "dur": 3.546, "args": { "External id": 18291,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780151.399, "dur": 0.429, "args": { "External id": 18292,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 883 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650780159.743, "dur": 7.850, "args": { "External id": 18293,"Record function id": 0, "Ev Idx": 884 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650780161.915, "dur": 5.126, "args": { "External id": 18294,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650780163.532, "dur": 3.132, "args": { "External id": 18295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 886 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650780164.859, "dur": 1.718, "args": { "External id": 18296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 887 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780170.948, "dur": 6.227, "args": { "External id": 18297,"Record function id": 0, "Sequence number": 246671, "Fwd thread id": 1, "Ev Idx": 888 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780172.481, "dur": 3.364, "args": { "External id": 18298,"Sequence number": 246671, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 889 } }, { "ph": "f", "id": 97, "pid": 1336757, "tid": 1381170, "ts": 1295650780172.481, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650780173.798, "dur": 1.905, "args": { "External id": 18299,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780174.606, "dur": 0.999, "args": { "External id": 18300,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 891 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780182.674, "dur": 118.228, "args": { "External id": 18301,"Record function id": 0, "Sequence number": 246670, "Fwd thread id": 1, "Ev Idx": 892 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780185.779, "dur": 107.104, "args": { "External id": 18302,"Sequence number": 246670, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 893 } }, { "ph": "f", "id": 98, "pid": 1336757, "tid": 1381170, "ts": 1295650780185.779, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780187.991, "dur": 3.199, "args": { "External id": 18303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780188.402, "dur": 2.327, "args": { "External id": 18304,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780190.078, "dur": 0.546, "args": { "External id": 18305,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650780191.999, "dur": 28.724, "args": { "External id": 18306,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780221.739, "dur": 5.636, "args": { "External id": 18307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780222.451, "dur": 4.384, "args": { "External id": 18308,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780225.650, "dur": 1.070, "args": { "External id": 18309,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780243.063, "dur": 7.948, "args": { "External id": 18310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780247.586, "dur": 2.752, "args": { "External id": 18311,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780249.514, "dur": 0.703, "args": { "External id": 18312,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650780251.666, "dur": 40.551, "args": { "External id": 18313,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 904 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780307.063, "dur": 30.343, "args": { "External id": 18314,"Record function id": 0, "Sequence number": 246669, "Fwd thread id": 1, "Ev Idx": 905 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780308.051, "dur": 7.697, "args": { "External id": 18315,"Sequence number": 246669, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 906 } }, { "ph": "f", "id": 99, "pid": 1336757, "tid": 1381170, "ts": 1295650780308.051, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650780312.810, "dur": 2.781, "args": { "External id": 18316,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780314.094, "dur": 1.400, "args": { "External id": 18317,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650780318.423, "dur": 16.726, "args": { "External id": 18318,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 909 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780341.091, "dur": 7.825, "args": { "External id": 18319,"Record function id": 0, "Sequence number": 246668, "Fwd thread id": 1, "Ev Idx": 910 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780342.251, "dur": 4.730, "args": { "External id": 18320,"Sequence number": 246668, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 911 } }, { "ph": "f", "id": 100, "pid": 1336757, "tid": 1381170, "ts": 1295650780342.251, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780342.982, "dur": 3.782, "args": { "External id": 18321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780343.638, "dur": 2.559, "args": { "External id": 18322,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780345.270, "dur": 0.785, "args": { "External id": 18323,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 914 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650780353.468, "dur": 8.663, "args": { "External id": 18324,"Record function id": 0, "Ev Idx": 915 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650780355.543, "dur": 6.071, "args": { "External id": 18325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650780356.883, "dur": 4.389, "args": { "External id": 18326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 917 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650780359.776, "dur": 1.406, "args": { "External id": 18327,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 918 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650780366.614, "dur": 340.897, "args": { "External id": 18328,"Record function id": 0, "Sequence number": 246667, "Fwd thread id": 1, "Ev Idx": 919 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650780368.329, "dur": 307.645, "args": { "External id": 18329,"Sequence number": 246667, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 920 } }, { "ph": "f", "id": 101, "pid": 1336757, "tid": 1381170, "ts": 1295650780368.329, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650780399.636, "dur": 2.040, "args": { "External id": 18330,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780400.599, "dur": 0.935, "args": { "External id": 18331,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650780415.534, "dur": 5.901, "args": { "External id": 18332,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650780432.077, "dur": 2.212, "args": { "External id": 18333,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780570.994, "dur": 1.751, "args": { "External id": 18334,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650780577.019, "dur": 35.086, "args": { "External id": 18335,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780587.449, "dur": 0.990, "args": { "External id": 18336,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650780621.356, "dur": 31.227, "args": { "External id": 18337,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650780623.273, "dur": 29.100, "args": { "External id": 18338,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780627.779, "dur": 5.486, "args": { "External id": 18339,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650780634.836, "dur": 16.978, "args": { "External id": 18340,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650780659.122, "dur": 2.768, "args": { "External id": 18341,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780660.618, "dur": 1.147, "args": { "External id": 18342,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650780667.521, "dur": 2.048, "args": { "External id": 18343,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780668.458, "dur": 1.025, "args": { "External id": 18344,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650780684.383, "dur": 19.426, "args": { "External id": 18345,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 936 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650780716.696, "dur": 11.338, "args": { "External id": 18346,"Record function id": 0, "Ev Idx": 937 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650780719.304, "dur": 8.036, "args": { "External id": 18347,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650780720.816, "dur": 5.559, "args": { "External id": 18348,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 939 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650780724.662, "dur": 1.619, "args": { "External id": 18349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 940 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780731.650, "dur": 4.975, "args": { "External id": 18350,"Record function id": 0, "Sequence number": 246666, "Fwd thread id": 1, "Ev Idx": 941 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650780732.991, "dur": 0.958, "args": { "External id": 18351,"Sequence number": 246666, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 942 } }, { "ph": "f", "id": 102, "pid": 1336757, "tid": 1381170, "ts": 1295650780732.991, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650780740.527, "dur": 461.840, "args": { "External id": 18352,"Record function id": 0, "Sequence number": 246665, "Fwd thread id": 1, "Ev Idx": 943 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650780742.226, "dur": 448.789, "args": { "External id": 18353,"Sequence number": 246665, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 944 } }, { "ph": "f", "id": 103, "pid": 1336757, "tid": 1381170, "ts": 1295650780742.226, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650780767.131, "dur": 7.870, "args": { "External id": 18354,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650780772.026, "dur": 2.736, "args": { "External id": 18355,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780777.942, "dur": 7.077, "args": { "External id": 18356,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780781.736, "dur": 2.767, "args": { "External id": 18357,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780783.848, "dur": 0.519, "args": { "External id": 18358,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1381170, "ts": 1295650780788.627, "dur": 94.715, "args": { "External id": 18359,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650780789.319, "dur": 3.960, "args": { "External id": 18360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650780789.829, "dur": 3.026, "args": { "External id": 18361,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650780791.239, "dur": 1.510, "args": { "External id": 18362,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1381170, "ts": 1295650780796.622, "dur": 86.107, "args": { "External id": 18363,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650780797.969, "dur": 83.883, "args": { "External id": 18364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650780886.827, "dur": 2.897, "args": { "External id": 18365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780888.264, "dur": 1.328, "args": { "External id": 18366,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650780919.254, "dur": 4.647, "args": { "External id": 18367,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650780925.269, "dur": 1.693, "args": { "External id": 18368,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650780928.449, "dur": 1.509, "args": { "External id": 18369,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650780963.422, "dur": 2.700, "args": { "External id": 18370,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650780964.429, "dur": 1.558, "args": { "External id": 18371,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336757, "tid": 1381170, "ts": 1295650781025.876, "dur": 146.429, "args": { "External id": 18372,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650781031.468, "dur": 6.448, "args": { "External id": 18373,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781035.762, "dur": 1.114, "args": { "External id": 18374,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650781039.946, "dur": 8.036, "args": { "External id": 18375,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781044.977, "dur": 2.328, "args": { "External id": 18376,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650781049.519, "dur": 2.581, "args": { "External id": 18377,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781051.388, "dur": 0.365, "args": { "External id": 18378,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650781052.827, "dur": 3.075, "args": { "External id": 18379,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781055.123, "dur": 0.376, "args": { "External id": 18380,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650781061.900, "dur": 2.969, "args": { "External id": 18381,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781064.221, "dur": 0.330, "args": { "External id": 18382,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781066.308, "dur": 6.499, "args": { "External id": 18383,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650781070.621, "dur": 2.007, "args": { "External id": 18384,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650781074.228, "dur": 2.908, "args": { "External id": 18385,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781076.416, "dur": 0.398, "args": { "External id": 18386,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781078.373, "dur": 3.450, "args": { "External id": 18387,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781079.330, "dur": 2.396, "args": { "External id": 18388,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295650781083.273, "dur": 73.665, "args": { "External id": 18389,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781160.958, "dur": 2.529, "args": { "External id": 18390,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650781164.879, "dur": 3.174, "args": { "External id": 18391,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781167.213, "dur": 0.466, "args": { "External id": 18392,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781170.344, "dur": 0.865, "args": { "External id": 18393,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 984 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650781215.015, "dur": 9.679, "args": { "External id": 18394,"Record function id": 0, "Ev Idx": 985 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650781217.560, "dur": 6.409, "args": { "External id": 18395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650781219.599, "dur": 3.653, "args": { "External id": 18396,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 987 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650781220.751, "dur": 2.396, "args": { "External id": 18397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 988 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781245.367, "dur": 10.383, "args": { "External id": 18398,"Record function id": 0, "Sequence number": 246664, "Fwd thread id": 1, "Ev Idx": 989 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781247.519, "dur": 5.227, "args": { "External id": 18399,"Sequence number": 246664, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 990 } }, { "ph": "f", "id": 104, "pid": 1336757, "tid": 1381170, "ts": 1295650781247.519, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781249.695, "dur": 2.835, "args": { "External id": 18400,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781250.687, "dur": 1.600, "args": { "External id": 18401,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 992 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781262.472, "dur": 176.492, "args": { "External id": 18402,"Record function id": 0, "Sequence number": 246663, "Fwd thread id": 1, "Ev Idx": 993 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781263.303, "dur": 169.640, "args": { "External id": 18403,"Sequence number": 246663, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 994 } }, { "ph": "f", "id": 105, "pid": 1336757, "tid": 1381170, "ts": 1295650781263.303, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781266.490, "dur": 4.452, "args": { "External id": 18404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781267.814, "dur": 2.580, "args": { "External id": 18405,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781269.589, "dur": 0.591, "args": { "External id": 18406,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650781272.016, "dur": 61.411, "args": { "External id": 18407,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781334.466, "dur": 6.176, "args": { "External id": 18408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781335.322, "dur": 4.479, "args": { "External id": 18409,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781338.681, "dur": 0.969, "args": { "External id": 18410,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781342.549, "dur": 4.128, "args": { "External id": 18411,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781343.550, "dur": 2.488, "args": { "External id": 18412,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781345.422, "dur": 0.489, "args": { "External id": 18413,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650781347.343, "dur": 84.791, "args": { "External id": 18414,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1005 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781443.469, "dur": 8.780, "args": { "External id": 18415,"Record function id": 0, "Sequence number": 246662, "Fwd thread id": 1, "Ev Idx": 1006 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781444.414, "dur": 6.492, "args": { "External id": 18416,"Sequence number": 246662, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1007 } }, { "ph": "f", "id": 106, "pid": 1336757, "tid": 1381170, "ts": 1295650781444.414, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781446.330, "dur": 4.412, "args": { "External id": 18417,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781449.428, "dur": 1.198, "args": { "External id": 18418,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1009 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781455.757, "dur": 8.114, "args": { "External id": 18419,"Record function id": 0, "Sequence number": 246661, "Fwd thread id": 1, "Ev Idx": 1010 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781456.658, "dur": 5.312, "args": { "External id": 18420,"Sequence number": 246661, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1011 } }, { "ph": "f", "id": 107, "pid": 1336757, "tid": 1381170, "ts": 1295650781456.658, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781458.022, "dur": 3.739, "args": { "External id": 18421,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781458.979, "dur": 2.258, "args": { "External id": 18422,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781460.717, "dur": 0.412, "args": { "External id": 18423,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1014 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650781468.021, "dur": 6.371, "args": { "External id": 18424,"Record function id": 0, "Ev Idx": 1015 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650781470.155, "dur": 3.678, "args": { "External id": 18425,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650781471.308, "dur": 2.257, "args": { "External id": 18426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1017 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650781472.022, "dur": 1.451, "args": { "External id": 18427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1018 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781479.697, "dur": 8.240, "args": { "External id": 18428,"Record function id": 0, "Sequence number": 246660, "Fwd thread id": 1, "Ev Idx": 1019 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781481.217, "dur": 4.746, "args": { "External id": 18429,"Sequence number": 246660, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1020 } }, { "ph": "f", "id": 108, "pid": 1336757, "tid": 1381170, "ts": 1295650781481.217, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781483.957, "dur": 1.838, "args": { "External id": 18430,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781485.000, "dur": 0.658, "args": { "External id": 18431,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1022 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781490.936, "dur": 186.378, "args": { "External id": 18432,"Record function id": 0, "Sequence number": 246659, "Fwd thread id": 1, "Ev Idx": 1023 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781514.754, "dur": 155.454, "args": { "External id": 18433,"Sequence number": 246659, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1024 } }, { "ph": "f", "id": 109, "pid": 1336757, "tid": 1381170, "ts": 1295650781514.754, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781516.769, "dur": 4.963, "args": { "External id": 18434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781517.321, "dur": 3.921, "args": { "External id": 18435,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781520.596, "dur": 0.536, "args": { "External id": 18436,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650781522.378, "dur": 51.434, "args": { "External id": 18437,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781574.924, "dur": 4.313, "args": { "External id": 18438,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781575.417, "dur": 3.216, "args": { "External id": 18439,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781576.958, "dur": 1.535, "args": { "External id": 18440,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781580.341, "dur": 6.040, "args": { "External id": 18441,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781580.935, "dur": 4.994, "args": { "External id": 18442,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781583.985, "dur": 1.880, "args": { "External id": 18443,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650781586.978, "dur": 82.545, "args": { "External id": 18444,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1035 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781681.951, "dur": 32.085, "args": { "External id": 18445,"Record function id": 0, "Sequence number": 246658, "Fwd thread id": 1, "Ev Idx": 1036 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781682.796, "dur": 3.422, "args": { "External id": 18446,"Sequence number": 246658, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1037 } }, { "ph": "f", "id": 110, "pid": 1336757, "tid": 1381170, "ts": 1295650781682.796, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781684.258, "dur": 1.819, "args": { "External id": 18447,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781685.059, "dur": 0.927, "args": { "External id": 18448,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650781689.077, "dur": 22.018, "args": { "External id": 18449,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1040 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781717.698, "dur": 9.422, "args": { "External id": 18450,"Record function id": 0, "Sequence number": 246657, "Fwd thread id": 1, "Ev Idx": 1041 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650781718.599, "dur": 6.563, "args": { "External id": 18451,"Sequence number": 246657, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1042 } }, { "ph": "f", "id": 111, "pid": 1336757, "tid": 1381170, "ts": 1295650781718.599, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650781721.358, "dur": 3.606, "args": { "External id": 18452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650781721.946, "dur": 2.484, "args": { "External id": 18453,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650781723.831, "dur": 0.478, "args": { "External id": 18454,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1045 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650781731.044, "dur": 4.839, "args": { "External id": 18455,"Record function id": 0, "Ev Idx": 1046 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650781732.717, "dur": 2.700, "args": { "External id": 18456,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650781733.542, "dur": 1.601, "args": { "External id": 18457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1048 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650781733.995, "dur": 1.071, "args": { "External id": 18458,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1049 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650781740.398, "dur": 458.974, "args": { "External id": 18459,"Record function id": 0, "Sequence number": 246656, "Fwd thread id": 1, "Ev Idx": 1050 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650781742.189, "dur": 422.994, "args": { "External id": 18460,"Sequence number": 246656, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 1051 } }, { "ph": "f", "id": 112, "pid": 1336757, "tid": 1381170, "ts": 1295650781742.189, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1381170, "ts": 1295650781765.194, "dur": 36.673, "args": { "External id": 18461,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650781766.457, "dur": 35.179, "args": { "External id": 18462,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650781768.936, "dur": 5.779, "args": { "External id": 18463,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 1054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650781771.509, "dur": 2.741, "args": { "External id": 18464,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650781776.056, "dur": 25.022, "args": { "External id": 18465,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781815.166, "dur": 1.964, "args": { "External id": 18466,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781815.832, "dur": 1.140, "args": { "External id": 18467,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650781820.663, "dur": 2.815, "args": { "External id": 18468,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650781821.512, "dur": 1.833, "args": { "External id": 18469,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650781837.360, "dur": 2.265, "args": { "External id": 18470,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650781850.462, "dur": 1.894, "args": { "External id": 18471,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650782051.297, "dur": 3.806, "args": { "External id": 18472,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650782059.232, "dur": 35.865, "args": { "External id": 18473,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782070.244, "dur": 0.919, "args": { "External id": 18474,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650782100.838, "dur": 31.576, "args": { "External id": 18475,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650782102.567, "dur": 29.647, "args": { "External id": 18476,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782107.207, "dur": 4.145, "args": { "External id": 18477,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650782114.568, "dur": 17.140, "args": { "External id": 18478,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650782136.852, "dur": 2.502, "args": { "External id": 18479,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650782138.140, "dur": 1.091, "args": { "External id": 18480,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650782145.792, "dur": 2.504, "args": { "External id": 18481,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650782146.859, "dur": 1.286, "args": { "External id": 18482,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650782150.607, "dur": 3.445, "args": { "External id": 18483,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650782151.625, "dur": 2.338, "args": { "External id": 18484,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650782179.936, "dur": 17.780, "args": { "External id": 18485,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1076 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650782212.208, "dur": 9.902, "args": { "External id": 18486,"Record function id": 0, "Ev Idx": 1077 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650782215.417, "dur": 6.082, "args": { "External id": 18487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650782217.604, "dur": 3.065, "args": { "External id": 18488,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1079 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650782218.495, "dur": 2.053, "args": { "External id": 18489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1080 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782226.564, "dur": 25.356, "args": { "External id": 18490,"Record function id": 0, "Sequence number": 246655, "Fwd thread id": 1, "Ev Idx": 1081 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782242.711, "dur": 5.710, "args": { "External id": 18491,"Sequence number": 246655, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1082 } }, { "ph": "f", "id": 113, "pid": 1336757, "tid": 1381170, "ts": 1295650782242.711, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650782244.547, "dur": 3.683, "args": { "External id": 18492,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650782245.611, "dur": 2.297, "args": { "External id": 18493,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1084 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782259.378, "dur": 126.905, "args": { "External id": 18494,"Record function id": 0, "Sequence number": 246654, "Fwd thread id": 1, "Ev Idx": 1085 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782260.272, "dur": 119.939, "args": { "External id": 18495,"Sequence number": 246654, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1086 } }, { "ph": "f", "id": 114, "pid": 1336757, "tid": 1381170, "ts": 1295650782260.272, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650782263.009, "dur": 5.504, "args": { "External id": 18496,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650782264.397, "dur": 3.443, "args": { "External id": 18497,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782266.804, "dur": 0.839, "args": { "External id": 18498,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650782269.480, "dur": 57.843, "args": { "External id": 18499,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650782328.523, "dur": 7.119, "args": { "External id": 18500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650782331.203, "dur": 3.688, "args": { "External id": 18501,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782333.350, "dur": 1.380, "args": { "External id": 18502,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650782337.094, "dur": 3.371, "args": { "External id": 18503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650782338.067, "dur": 1.936, "args": { "External id": 18504,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782339.514, "dur": 0.376, "args": { "External id": 18505,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650782341.152, "dur": 38.231, "args": { "External id": 18506,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1097 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782390.869, "dur": 10.274, "args": { "External id": 18507,"Record function id": 0, "Sequence number": 246653, "Fwd thread id": 1, "Ev Idx": 1098 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782391.926, "dur": 7.210, "args": { "External id": 18508,"Sequence number": 246653, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1099 } }, { "ph": "f", "id": 115, "pid": 1336757, "tid": 1381170, "ts": 1295650782391.926, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650782395.607, "dur": 3.389, "args": { "External id": 18509,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650782396.505, "dur": 2.388, "args": { "External id": 18510,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782404.848, "dur": 7.008, "args": { "External id": 18511,"Record function id": 0, "Sequence number": 246652, "Fwd thread id": 1, "Ev Idx": 1102 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782405.678, "dur": 4.443, "args": { "External id": 18512,"Sequence number": 246652, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1103 } }, { "ph": "f", "id": 116, "pid": 1336757, "tid": 1381170, "ts": 1295650782405.678, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650782406.479, "dur": 3.430, "args": { "External id": 18513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650782407.174, "dur": 2.204, "args": { "External id": 18514,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782408.831, "dur": 0.427, "args": { "External id": 18515,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1106 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650782416.090, "dur": 8.889, "args": { "External id": 18516,"Record function id": 0, "Ev Idx": 1107 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650782417.970, "dur": 6.457, "args": { "External id": 18517,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650782419.057, "dur": 5.059, "args": { "External id": 18518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1109 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650782422.538, "dur": 1.450, "args": { "External id": 18519,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1110 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782430.113, "dur": 6.357, "args": { "External id": 18520,"Record function id": 0, "Sequence number": 246651, "Fwd thread id": 1, "Ev Idx": 1111 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650782430.966, "dur": 3.798, "args": { "External id": 18521,"Sequence number": 246651, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1112 } }, { "ph": "f", "id": 117, "pid": 1336757, "tid": 1381170, "ts": 1295650782430.966, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650782432.104, "dur": 2.513, "args": { "External id": 18522,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650782433.121, "dur": 1.339, "args": { "External id": 18523,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1114 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650782440.698, "dur": 275.194, "args": { "External id": 18524,"Record function id": 0, "Sequence number": 246650, "Fwd thread id": 1, "Ev Idx": 1115 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650782442.335, "dur": 256.783, "args": { "External id": 18525,"Sequence number": 246650, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1116 } }, { "ph": "f", "id": 118, "pid": 1336757, "tid": 1381170, "ts": 1295650782442.335, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650782456.611, "dur": 6.840, "args": { "External id": 18526,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782459.543, "dur": 3.512, "args": { "External id": 18527,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650782465.509, "dur": 4.720, "args": { "External id": 18528,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782467.033, "dur": 3.001, "args": { "External id": 18529,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650782480.443, "dur": 5.411, "args": { "External id": 18530,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782484.157, "dur": 1.506, "args": { "External id": 18531,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1122 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650782510.016, "dur": 164.855, "args": { "External id": 18532,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650782583.492, "dur": 4.036, "args": { "External id": 18533,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650782589.511, "dur": 3.243, "args": { "External id": 18534,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650782686.932, "dur": 3.281, "args": { "External id": 18535,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650782693.161, "dur": 0.583, "args": { "External id": 18536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650782696.043, "dur": 0.731, "args": { "External id": 18537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1128 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650782722.879, "dur": 215.264, "args": { "External id": 18538,"Record function id": 0, "Sequence number": 246649, "Fwd thread id": 1, "Ev Idx": 1129 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650782724.649, "dur": 207.278, "args": { "External id": 18539,"Sequence number": 246649, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1130 } }, { "ph": "f", "id": 119, "pid": 1336757, "tid": 1381170, "ts": 1295650782724.649, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650782742.624, "dur": 43.941, "args": { "External id": 18540,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782746.104, "dur": 2.736, "args": { "External id": 18541,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650782750.127, "dur": 35.666, "args": { "External id": 18542,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650782795.598, "dur": 4.333, "args": { "External id": 18543,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782797.397, "dur": 2.258, "args": { "External id": 18544,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1135 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650782944.865, "dur": 213.976, "args": { "External id": 18545,"Record function id": 0, "Sequence number": 246648, "Fwd thread id": 1, "Ev Idx": 1136 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650782946.846, "dur": 205.294, "args": { "External id": 18546,"Sequence number": 246648, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1137 } }, { "ph": "f", "id": 120, "pid": 1336757, "tid": 1381170, "ts": 1295650782946.846, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650782959.158, "dur": 85.385, "args": { "External id": 18547,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650782961.666, "dur": 2.361, "args": { "External id": 18548,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650782968.752, "dur": 74.959, "args": { "External id": 18549,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650783054.269, "dur": 5.501, "args": { "External id": 18550,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783056.473, "dur": 2.968, "args": { "External id": 18551,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1142 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783169.073, "dur": 15.383, "args": { "External id": 18552,"Record function id": 0, "Sequence number": 246647, "Fwd thread id": 1, "Ev Idx": 1143 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783170.689, "dur": 11.153, "args": { "External id": 18553,"Sequence number": 246647, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1144 } }, { "ph": "f", "id": 121, "pid": 1336757, "tid": 1381170, "ts": 1295650783170.689, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783173.253, "dur": 8.303, "args": { "External id": 18554,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783174.702, "dur": 6.718, "args": { "External id": 18555,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1146 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783187.775, "dur": 6.573, "args": { "External id": 18556,"Record function id": 0, "Sequence number": 246646, "Fwd thread id": 1, "Ev Idx": 1147 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783188.680, "dur": 3.673, "args": { "External id": 18557,"Sequence number": 246646, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1148 } }, { "ph": "f", "id": 122, "pid": 1336757, "tid": 1381170, "ts": 1295650783188.680, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783190.324, "dur": 1.877, "args": { "External id": 18558,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783191.237, "dur": 0.872, "args": { "External id": 18559,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1150 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783197.974, "dur": 8.282, "args": { "External id": 18560,"Record function id": 0, "Sequence number": 246645, "Fwd thread id": 1, "Ev Idx": 1151 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783198.704, "dur": 5.549, "args": { "External id": 18561,"Sequence number": 246645, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1152 } }, { "ph": "f", "id": 123, "pid": 1336757, "tid": 1381170, "ts": 1295650783198.704, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783202.100, "dur": 2.008, "args": { "External id": 18562,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783203.063, "dur": 0.914, "args": { "External id": 18563,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1154 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783209.744, "dur": 7.216, "args": { "External id": 18564,"Record function id": 0, "Sequence number": 246644, "Fwd thread id": 1, "Ev Idx": 1155 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783211.172, "dur": 3.218, "args": { "External id": 18565,"Sequence number": 246644, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1156 } }, { "ph": "f", "id": 124, "pid": 1336757, "tid": 1381170, "ts": 1295650783211.172, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783212.430, "dur": 1.830, "args": { "External id": 18566,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783213.331, "dur": 0.834, "args": { "External id": 18567,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1158 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783220.040, "dur": 169.489, "args": { "External id": 18568,"Record function id": 0, "Sequence number": 246643, "Fwd thread id": 1, "Ev Idx": 1159 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783220.875, "dur": 160.409, "args": { "External id": 18569,"Sequence number": 246643, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1160 } }, { "ph": "f", "id": 125, "pid": 1336757, "tid": 1381170, "ts": 1295650783220.875, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783224.281, "dur": 29.950, "args": { "External id": 18570,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783247.745, "dur": 5.550, "args": { "External id": 18571,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783251.170, "dur": 1.627, "args": { "External id": 18572,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650783255.830, "dur": 68.668, "args": { "External id": 18573,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783325.763, "dur": 5.175, "args": { "External id": 18574,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783326.726, "dur": 3.382, "args": { "External id": 18575,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783328.857, "dur": 1.121, "args": { "External id": 18576,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783332.679, "dur": 5.938, "args": { "External id": 18577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783336.463, "dur": 1.670, "args": { "External id": 18578,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783337.763, "dur": 0.282, "args": { "External id": 18579,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650783339.349, "dur": 41.226, "args": { "External id": 18580,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1171 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783397.846, "dur": 7.648, "args": { "External id": 18581,"Record function id": 0, "Sequence number": 246642, "Fwd thread id": 1, "Ev Idx": 1172 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783398.999, "dur": 4.570, "args": { "External id": 18582,"Sequence number": 246642, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1173 } }, { "ph": "f", "id": 126, "pid": 1336757, "tid": 1381170, "ts": 1295650783398.999, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783400.816, "dur": 2.606, "args": { "External id": 18583,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783402.051, "dur": 1.259, "args": { "External id": 18584,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1175 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783408.829, "dur": 9.989, "args": { "External id": 18585,"Record function id": 0, "Sequence number": 246641, "Fwd thread id": 1, "Ev Idx": 1176 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783409.568, "dur": 7.094, "args": { "External id": 18586,"Sequence number": 246641, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1177 } }, { "ph": "f", "id": 127, "pid": 1336757, "tid": 1381170, "ts": 1295650783409.568, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783412.739, "dur": 3.689, "args": { "External id": 18587,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783413.448, "dur": 2.471, "args": { "External id": 18588,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783415.422, "dur": 0.396, "args": { "External id": 18589,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1180 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650783425.101, "dur": 9.440, "args": { "External id": 18590,"Record function id": 0, "Ev Idx": 1181 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650783427.188, "dur": 6.594, "args": { "External id": 18591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650783429.708, "dur": 3.764, "args": { "External id": 18592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1183 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650783430.724, "dur": 2.663, "args": { "External id": 18593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1184 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783438.268, "dur": 8.636, "args": { "External id": 18594,"Record function id": 0, "Sequence number": 246640, "Fwd thread id": 1, "Ev Idx": 1185 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783439.840, "dur": 4.833, "args": { "External id": 18595,"Sequence number": 246640, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1186 } }, { "ph": "f", "id": 128, "pid": 1336757, "tid": 1381170, "ts": 1295650783439.840, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783440.860, "dur": 3.659, "args": { "External id": 18596,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783443.678, "dur": 0.748, "args": { "External id": 18597,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1188 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783450.181, "dur": 89.487, "args": { "External id": 18598,"Record function id": 0, "Sequence number": 246639, "Fwd thread id": 1, "Ev Idx": 1189 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783450.984, "dur": 83.215, "args": { "External id": 18599,"Sequence number": 246639, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1190 } }, { "ph": "f", "id": 129, "pid": 1336757, "tid": 1381170, "ts": 1295650783450.984, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783453.154, "dur": 2.550, "args": { "External id": 18600,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783453.638, "dur": 1.626, "args": { "External id": 18601,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783454.844, "dur": 0.326, "args": { "External id": 18602,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650783456.468, "dur": 26.392, "args": { "External id": 18603,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783486.264, "dur": 3.955, "args": { "External id": 18604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783487.002, "dur": 2.609, "args": { "External id": 18605,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783488.737, "dur": 0.747, "args": { "External id": 18606,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783491.211, "dur": 5.313, "args": { "External id": 18607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783492.275, "dur": 3.803, "args": { "External id": 18608,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783493.530, "dur": 2.410, "args": { "External id": 18609,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650783499.410, "dur": 34.186, "args": { "External id": 18610,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1201 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783544.122, "dur": 32.389, "args": { "External id": 18611,"Record function id": 0, "Sequence number": 246638, "Fwd thread id": 1, "Ev Idx": 1202 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783545.153, "dur": 4.281, "args": { "External id": 18612,"Sequence number": 246638, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1203 } }, { "ph": "f", "id": 130, "pid": 1336757, "tid": 1381170, "ts": 1295650783545.153, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783546.616, "dur": 2.672, "args": { "External id": 18613,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783547.989, "dur": 1.205, "args": { "External id": 18614,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650783552.311, "dur": 22.087, "args": { "External id": 18615,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1206 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783580.123, "dur": 9.615, "args": { "External id": 18616,"Record function id": 0, "Sequence number": 246637, "Fwd thread id": 1, "Ev Idx": 1207 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783581.139, "dur": 6.738, "args": { "External id": 18617,"Sequence number": 246637, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1208 } }, { "ph": "f", "id": 131, "pid": 1336757, "tid": 1381170, "ts": 1295650783581.139, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783582.047, "dur": 5.627, "args": { "External id": 18618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783584.870, "dur": 2.269, "args": { "External id": 18619,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783586.553, "dur": 0.437, "args": { "External id": 18620,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1211 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650783593.864, "dur": 5.346, "args": { "External id": 18621,"Record function id": 0, "Ev Idx": 1212 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650783595.463, "dur": 3.226, "args": { "External id": 18622,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650783596.657, "dur": 1.733, "args": { "External id": 18623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1214 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650783597.285, "dur": 1.005, "args": { "External id": 18624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1215 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783602.683, "dur": 9.302, "args": { "External id": 18625,"Record function id": 0, "Sequence number": 246636, "Fwd thread id": 1, "Ev Idx": 1216 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783604.064, "dur": 5.642, "args": { "External id": 18626,"Sequence number": 246636, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1217 } }, { "ph": "f", "id": 132, "pid": 1336757, "tid": 1381170, "ts": 1295650783604.064, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783605.154, "dur": 4.398, "args": { "External id": 18627,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783608.684, "dur": 0.762, "args": { "External id": 18628,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1219 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783617.410, "dur": 86.760, "args": { "External id": 18629,"Record function id": 0, "Sequence number": 246635, "Fwd thread id": 1, "Ev Idx": 1220 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783618.553, "dur": 78.817, "args": { "External id": 18630,"Sequence number": 246635, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1221 } }, { "ph": "f", "id": 133, "pid": 1336757, "tid": 1381170, "ts": 1295650783618.553, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783620.677, "dur": 3.318, "args": { "External id": 18631,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783621.150, "dur": 2.373, "args": { "External id": 18632,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783623.035, "dur": 0.377, "args": { "External id": 18633,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650783624.553, "dur": 27.202, "args": { "External id": 18634,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783652.755, "dur": 5.977, "args": { "External id": 18635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783655.338, "dur": 2.732, "args": { "External id": 18636,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783656.830, "dur": 1.078, "args": { "External id": 18637,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783659.781, "dur": 3.608, "args": { "External id": 18638,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783661.152, "dur": 1.833, "args": { "External id": 18639,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783662.633, "dur": 0.248, "args": { "External id": 18640,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650783664.229, "dur": 32.490, "args": { "External id": 18641,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1232 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783708.489, "dur": 25.274, "args": { "External id": 18642,"Record function id": 0, "Sequence number": 246634, "Fwd thread id": 1, "Ev Idx": 1233 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783709.549, "dur": 5.702, "args": { "External id": 18643,"Sequence number": 246634, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1234 } }, { "ph": "f", "id": 134, "pid": 1336757, "tid": 1381170, "ts": 1295650783709.549, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783712.951, "dur": 2.155, "args": { "External id": 18644,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783713.971, "dur": 1.024, "args": { "External id": 18645,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650783717.250, "dur": 14.476, "args": { "External id": 18646,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1237 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783737.421, "dur": 7.615, "args": { "External id": 18647,"Record function id": 0, "Sequence number": 246633, "Fwd thread id": 1, "Ev Idx": 1238 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650783738.345, "dur": 4.884, "args": { "External id": 18648,"Sequence number": 246633, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1239 } }, { "ph": "f", "id": 135, "pid": 1336757, "tid": 1381170, "ts": 1295650783738.345, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650783739.303, "dur": 3.717, "args": { "External id": 18649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650783740.036, "dur": 2.470, "args": { "External id": 18650,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783741.936, "dur": 0.466, "args": { "External id": 18651,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1242 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650783748.946, "dur": 7.690, "args": { "External id": 18652,"Record function id": 0, "Ev Idx": 1243 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650783750.672, "dur": 5.508, "args": { "External id": 18653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650783751.649, "dur": 4.227, "args": { "External id": 18654,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1245 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650783754.649, "dur": 1.151, "args": { "External id": 18655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1246 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650783763.383, "dur": 374.298, "args": { "External id": 18656,"Record function id": 0, "Sequence number": 246632, "Fwd thread id": 1, "Ev Idx": 1247 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650783765.110, "dur": 340.928, "args": { "External id": 18657,"Sequence number": 246632, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1248 } }, { "ph": "f", "id": 136, "pid": 1336757, "tid": 1381170, "ts": 1295650783765.110, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650783792.861, "dur": 2.084, "args": { "External id": 18658,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783793.678, "dur": 1.123, "args": { "External id": 18659,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650783807.135, "dur": 4.879, "args": { "External id": 18660,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650783820.039, "dur": 1.602, "args": { "External id": 18661,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650783958.841, "dur": 1.848, "args": { "External id": 18662,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650783964.817, "dur": 74.269, "args": { "External id": 18663,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650783973.895, "dur": 0.739, "args": { "External id": 18664,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650784046.714, "dur": 32.210, "args": { "External id": 18665,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650784048.459, "dur": 30.250, "args": { "External id": 18666,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784052.866, "dur": 5.392, "args": { "External id": 18667,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650784059.858, "dur": 18.309, "args": { "External id": 18668,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650784084.222, "dur": 5.651, "args": { "External id": 18669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784088.237, "dur": 1.529, "args": { "External id": 18670,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784096.880, "dur": 2.196, "args": { "External id": 18671,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784097.972, "dur": 0.996, "args": { "External id": 18672,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650784116.024, "dur": 17.789, "args": { "External id": 18673,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1264 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784150.214, "dur": 9.322, "args": { "External id": 18674,"Record function id": 0, "Ev Idx": 1265 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784152.843, "dur": 5.950, "args": { "External id": 18675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784154.741, "dur": 3.067, "args": { "External id": 18676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1267 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784155.779, "dur": 1.935, "args": { "External id": 18677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1268 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784163.528, "dur": 6.753, "args": { "External id": 18678,"Record function id": 0, "Sequence number": 246631, "Fwd thread id": 1, "Ev Idx": 1269 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784166.064, "dur": 1.030, "args": { "External id": 18679,"Sequence number": 246631, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1270 } }, { "ph": "f", "id": 137, "pid": 1336757, "tid": 1381170, "ts": 1295650784166.064, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650784174.214, "dur": 426.715, "args": { "External id": 18680,"Record function id": 0, "Sequence number": 246630, "Fwd thread id": 1, "Ev Idx": 1271 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650784175.597, "dur": 413.479, "args": { "External id": 18681,"Sequence number": 246630, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1272 } }, { "ph": "f", "id": 138, "pid": 1336757, "tid": 1381170, "ts": 1295650784175.597, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784204.146, "dur": 8.096, "args": { "External id": 18682,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650784208.970, "dur": 2.972, "args": { "External id": 18683,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 1274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784215.136, "dur": 7.427, "args": { "External id": 18684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784216.756, "dur": 5.172, "args": { "External id": 18685,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784220.988, "dur": 0.797, "args": { "External id": 18686,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1381170, "ts": 1295650784225.945, "dur": 108.311, "args": { "External id": 18687,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 1278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784226.608, "dur": 21.923, "args": { "External id": 18688,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 1279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784242.701, "dur": 5.025, "args": { "External id": 18689,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784245.374, "dur": 2.033, "args": { "External id": 18690,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1381170, "ts": 1295650784250.235, "dur": 83.328, "args": { "External id": 18691,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 1282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650784251.697, "dur": 81.059, "args": { "External id": 18692,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 1283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650784340.664, "dur": 3.185, "args": { "External id": 18693,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 1284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784342.269, "dur": 1.481, "args": { "External id": 18694,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 1285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650784377.001, "dur": 5.414, "args": { "External id": 18695,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650784383.953, "dur": 1.687, "args": { "External id": 18696,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650784387.087, "dur": 1.582, "args": { "External id": 18697,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784423.334, "dur": 2.409, "args": { "External id": 18698,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784424.363, "dur": 1.207, "args": { "External id": 18699,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336757, "tid": 1381170, "ts": 1295650784445.710, "dur": 122.053, "args": { "External id": 18700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 1291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650784450.996, "dur": 6.322, "args": { "External id": 18701,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784454.604, "dur": 1.886, "args": { "External id": 18702,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650784459.103, "dur": 6.761, "args": { "External id": 18703,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 1294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784462.301, "dur": 2.811, "args": { "External id": 18704,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 1295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1381170, "ts": 1295650784467.538, "dur": 2.908, "args": { "External id": 18705,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 1296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784469.501, "dur": 0.582, "args": { "External id": 18706,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650784471.328, "dur": 3.313, "args": { "External id": 18707,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784473.387, "dur": 0.615, "args": { "External id": 18708,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 1299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650784480.504, "dur": 3.724, "args": { "External id": 18709,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 1300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784483.428, "dur": 0.485, "args": { "External id": 18710,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 1301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784485.296, "dur": 6.306, "args": { "External id": 18711,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 1302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336757, "tid": 1381170, "ts": 1295650784489.254, "dur": 2.143, "args": { "External id": 18712,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 1303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650784492.941, "dur": 2.906, "args": { "External id": 18713,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 1304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784495.250, "dur": 0.307, "args": { "External id": 18714,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 1305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784497.014, "dur": 4.181, "args": { "External id": 18715,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784498.321, "dur": 2.775, "args": { "External id": 18716,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295650784502.583, "dur": 51.680, "args": { "External id": 18717,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 1308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784556.481, "dur": 2.603, "args": { "External id": 18718,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 1309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336757, "tid": 1381170, "ts": 1295650784560.299, "dur": 3.267, "args": { "External id": 18719,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 1310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784562.465, "dur": 0.499, "args": { "External id": 18720,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 1311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784565.829, "dur": 0.884, "args": { "External id": 18721,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 1312 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784611.915, "dur": 9.211, "args": { "External id": 18722,"Record function id": 0, "Ev Idx": 1313 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784614.384, "dur": 5.967, "args": { "External id": 18723,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784616.329, "dur": 3.258, "args": { "External id": 18724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1315 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784617.222, "dur": 2.240, "args": { "External id": 18725,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1316 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784625.220, "dur": 6.962, "args": { "External id": 18726,"Record function id": 0, "Sequence number": 246629, "Fwd thread id": 1, "Ev Idx": 1317 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784626.495, "dur": 3.885, "args": { "External id": 18727,"Sequence number": 246629, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1318 } }, { "ph": "f", "id": 139, "pid": 1336757, "tid": 1381170, "ts": 1295650784626.495, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784628.177, "dur": 2.007, "args": { "External id": 18728,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784629.124, "dur": 0.943, "args": { "External id": 18729,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1320 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784635.564, "dur": 120.390, "args": { "External id": 18730,"Record function id": 0, "Sequence number": 246628, "Fwd thread id": 1, "Ev Idx": 1321 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784636.458, "dur": 113.136, "args": { "External id": 18731,"Sequence number": 246628, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1322 } }, { "ph": "f", "id": 140, "pid": 1336757, "tid": 1381170, "ts": 1295650784636.458, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784641.662, "dur": 4.629, "args": { "External id": 18732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784643.211, "dur": 2.546, "args": { "External id": 18733,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784644.906, "dur": 0.716, "args": { "External id": 18734,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650784647.306, "dur": 39.644, "args": { "External id": 18735,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784687.953, "dur": 5.950, "args": { "External id": 18736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784688.495, "dur": 4.620, "args": { "External id": 18737,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784692.218, "dur": 0.745, "args": { "External id": 18738,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784695.317, "dur": 3.339, "args": { "External id": 18739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784696.416, "dur": 1.819, "args": { "External id": 18740,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784697.803, "dur": 0.341, "args": { "External id": 18741,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650784699.266, "dur": 49.531, "args": { "External id": 18742,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784760.528, "dur": 8.189, "args": { "External id": 18743,"Record function id": 0, "Sequence number": 246627, "Fwd thread id": 1, "Ev Idx": 1334 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784761.581, "dur": 5.575, "args": { "External id": 18744,"Sequence number": 246627, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1335 } }, { "ph": "f", "id": 141, "pid": 1336757, "tid": 1381170, "ts": 1295650784761.581, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784763.049, "dur": 3.952, "args": { "External id": 18745,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784765.749, "dur": 1.145, "args": { "External id": 18746,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784772.252, "dur": 7.162, "args": { "External id": 18747,"Record function id": 0, "Sequence number": 246626, "Fwd thread id": 1, "Ev Idx": 1338 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784773.037, "dur": 4.693, "args": { "External id": 18748,"Sequence number": 246626, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1339 } }, { "ph": "f", "id": 142, "pid": 1336757, "tid": 1381170, "ts": 1295650784773.037, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784773.890, "dur": 3.595, "args": { "External id": 18749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784774.590, "dur": 2.417, "args": { "External id": 18750,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784776.589, "dur": 0.301, "args": { "External id": 18751,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1342 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784783.489, "dur": 4.884, "args": { "External id": 18752,"Record function id": 0, "Ev Idx": 1343 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784785.172, "dur": 2.695, "args": { "External id": 18753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784786.072, "dur": 1.562, "args": { "External id": 18754,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1345 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784786.634, "dur": 0.931, "args": { "External id": 18755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1346 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784791.818, "dur": 7.592, "args": { "External id": 18756,"Record function id": 0, "Sequence number": 246625, "Fwd thread id": 1, "Ev Idx": 1347 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784793.198, "dur": 4.400, "args": { "External id": 18757,"Sequence number": 246625, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1348 } }, { "ph": "f", "id": 143, "pid": 1336757, "tid": 1381170, "ts": 1295650784793.198, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784795.830, "dur": 1.628, "args": { "External id": 18758,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784796.660, "dur": 0.686, "args": { "External id": 18759,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1350 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784802.496, "dur": 107.748, "args": { "External id": 18760,"Record function id": 0, "Sequence number": 246624, "Fwd thread id": 1, "Ev Idx": 1351 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784803.286, "dur": 100.261, "args": { "External id": 18761,"Sequence number": 246624, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1352 } }, { "ph": "f", "id": 144, "pid": 1336757, "tid": 1381170, "ts": 1295650784803.286, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784804.759, "dur": 5.114, "args": { "External id": 18762,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784805.263, "dur": 4.111, "args": { "External id": 18763,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784808.616, "dur": 0.653, "args": { "External id": 18764,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650784810.443, "dur": 32.385, "args": { "External id": 18765,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784843.848, "dur": 4.361, "args": { "External id": 18766,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784844.615, "dur": 3.040, "args": { "External id": 18767,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784846.519, "dur": 1.001, "args": { "External id": 18768,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784849.287, "dur": 6.087, "args": { "External id": 18769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784850.034, "dur": 4.901, "args": { "External id": 18770,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784852.834, "dur": 2.037, "args": { "External id": 18771,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650784855.967, "dur": 46.866, "args": { "External id": 18772,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1363 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784916.429, "dur": 30.070, "args": { "External id": 18773,"Record function id": 0, "Sequence number": 246623, "Fwd thread id": 1, "Ev Idx": 1364 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784917.425, "dur": 3.786, "args": { "External id": 18774,"Sequence number": 246623, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1365 } }, { "ph": "f", "id": 145, "pid": 1336757, "tid": 1381170, "ts": 1295650784917.425, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650784919.078, "dur": 1.978, "args": { "External id": 18775,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650784919.860, "dur": 1.053, "args": { "External id": 18776,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650784923.771, "dur": 19.593, "args": { "External id": 18777,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1368 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784950.125, "dur": 9.436, "args": { "External id": 18778,"Record function id": 0, "Sequence number": 246622, "Fwd thread id": 1, "Ev Idx": 1369 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650784951.117, "dur": 6.311, "args": { "External id": 18779,"Sequence number": 246622, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1370 } }, { "ph": "f", "id": 146, "pid": 1336757, "tid": 1381170, "ts": 1295650784951.117, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650784951.902, "dur": 5.305, "args": { "External id": 18780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650784954.775, "dur": 1.928, "args": { "External id": 18781,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650784956.242, "dur": 0.341, "args": { "External id": 18782,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1373 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784963.699, "dur": 5.022, "args": { "External id": 18783,"Record function id": 0, "Ev Idx": 1374 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650784965.486, "dur": 2.765, "args": { "External id": 18784,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784966.339, "dur": 1.620, "args": { "External id": 18785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1376 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650784966.844, "dur": 1.030, "args": { "External id": 18786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1377 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650784972.938, "dur": 473.415, "args": { "External id": 18787,"Record function id": 0, "Sequence number": 246621, "Fwd thread id": 1, "Ev Idx": 1378 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650784978.326, "dur": 433.826, "args": { "External id": 18788,"Sequence number": 246621, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 1379 } }, { "ph": "f", "id": 147, "pid": 1336757, "tid": 1381170, "ts": 1295650784978.326, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1381170, "ts": 1295650785036.949, "dur": 39.757, "args": { "External id": 18789,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650785038.362, "dur": 38.156, "args": { "External id": 18790,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650785041.499, "dur": 8.047, "args": { "External id": 18791,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 1382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650785044.767, "dur": 3.947, "args": { "External id": 18792,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650785051.090, "dur": 24.904, "args": { "External id": 18793,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650785090.235, "dur": 2.687, "args": { "External id": 18794,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785091.084, "dur": 1.690, "args": { "External id": 18795,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650785096.527, "dur": 2.966, "args": { "External id": 18796,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785097.466, "dur": 1.935, "args": { "External id": 18797,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650785113.403, "dur": 2.526, "args": { "External id": 18798,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650785126.342, "dur": 3.388, "args": { "External id": 18799,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785300.485, "dur": 4.110, "args": { "External id": 18800,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650785309.174, "dur": 34.651, "args": { "External id": 18801,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785319.326, "dur": 0.955, "args": { "External id": 18802,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650785349.309, "dur": 29.959, "args": { "External id": 18803,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650785351.221, "dur": 27.840, "args": { "External id": 18804,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785355.573, "dur": 3.830, "args": { "External id": 18805,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650785362.726, "dur": 15.787, "args": { "External id": 18806,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650785383.492, "dur": 2.484, "args": { "External id": 18807,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785384.760, "dur": 1.068, "args": { "External id": 18808,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650785393.459, "dur": 2.957, "args": { "External id": 18809,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785394.776, "dur": 1.536, "args": { "External id": 18810,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650785398.867, "dur": 2.935, "args": { "External id": 18811,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785400.011, "dur": 1.692, "args": { "External id": 18812,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650785427.205, "dur": 17.292, "args": { "External id": 18813,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1404 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650785460.332, "dur": 9.333, "args": { "External id": 18814,"Record function id": 0, "Ev Idx": 1405 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650785462.965, "dur": 5.984, "args": { "External id": 18815,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650785465.206, "dur": 2.922, "args": { "External id": 18816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1407 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650785466.279, "dur": 1.774, "args": { "External id": 18817,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1408 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785473.439, "dur": 10.036, "args": { "External id": 18818,"Record function id": 0, "Sequence number": 246620, "Fwd thread id": 1, "Ev Idx": 1409 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785475.128, "dur": 6.310, "args": { "External id": 18819,"Sequence number": 246620, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1410 } }, { "ph": "f", "id": 148, "pid": 1336757, "tid": 1381170, "ts": 1295650785475.128, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650785476.770, "dur": 4.475, "args": { "External id": 18820,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785479.824, "dur": 1.254, "args": { "External id": 18821,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1412 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785486.827, "dur": 127.888, "args": { "External id": 18822,"Record function id": 0, "Sequence number": 246619, "Fwd thread id": 1, "Ev Idx": 1413 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785487.740, "dur": 120.281, "args": { "External id": 18823,"Sequence number": 246619, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1414 } }, { "ph": "f", "id": 149, "pid": 1336757, "tid": 1381170, "ts": 1295650785487.740, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650785490.778, "dur": 5.210, "args": { "External id": 18824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650785491.943, "dur": 3.380, "args": { "External id": 18825,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785494.274, "dur": 0.871, "args": { "External id": 18826,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650785497.218, "dur": 56.832, "args": { "External id": 18827,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650785557.342, "dur": 4.945, "args": { "External id": 18828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650785558.073, "dur": 3.466, "args": { "External id": 18829,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785560.145, "dur": 1.217, "args": { "External id": 18830,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650785563.471, "dur": 3.289, "args": { "External id": 18831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650785564.315, "dur": 1.923, "args": { "External id": 18832,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785565.729, "dur": 0.415, "args": { "External id": 18833,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650785569.175, "dur": 38.014, "args": { "External id": 18834,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1425 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785619.506, "dur": 7.778, "args": { "External id": 18835,"Record function id": 0, "Sequence number": 246618, "Fwd thread id": 1, "Ev Idx": 1426 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785620.255, "dur": 5.068, "args": { "External id": 18836,"Sequence number": 246618, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1427 } }, { "ph": "f", "id": 150, "pid": 1336757, "tid": 1381170, "ts": 1295650785620.255, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650785621.938, "dur": 3.234, "args": { "External id": 18837,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785622.835, "dur": 2.242, "args": { "External id": 18838,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1429 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785630.675, "dur": 9.143, "args": { "External id": 18839,"Record function id": 0, "Sequence number": 246617, "Fwd thread id": 1, "Ev Idx": 1430 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785631.410, "dur": 6.459, "args": { "External id": 18840,"Sequence number": 246617, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1431 } }, { "ph": "f", "id": 151, "pid": 1336757, "tid": 1381170, "ts": 1295650785631.410, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650785632.221, "dur": 5.415, "args": { "External id": 18841,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650785633.145, "dur": 3.978, "args": { "External id": 18842,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785636.706, "dur": 0.304, "args": { "External id": 18843,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1434 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650785643.949, "dur": 5.228, "args": { "External id": 18844,"Record function id": 0, "Ev Idx": 1435 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650785645.792, "dur": 2.857, "args": { "External id": 18845,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650785646.930, "dur": 1.474, "args": { "External id": 18846,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1437 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650785647.339, "dur": 0.970, "args": { "External id": 18847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1438 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785652.240, "dur": 6.266, "args": { "External id": 18848,"Record function id": 0, "Sequence number": 246616, "Fwd thread id": 1, "Ev Idx": 1439 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650785653.088, "dur": 3.491, "args": { "External id": 18849,"Sequence number": 246616, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1440 } }, { "ph": "f", "id": 152, "pid": 1336757, "tid": 1381170, "ts": 1295650785653.088, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650785654.332, "dur": 2.116, "args": { "External id": 18850,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650785655.208, "dur": 1.099, "args": { "External id": 18851,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1442 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650785662.606, "dur": 262.933, "args": { "External id": 18852,"Record function id": 0, "Sequence number": 246615, "Fwd thread id": 1, "Ev Idx": 1443 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650785664.209, "dur": 245.726, "args": { "External id": 18853,"Sequence number": 246615, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1444 } }, { "ph": "f", "id": 153, "pid": 1336757, "tid": 1381170, "ts": 1295650785664.209, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650785677.137, "dur": 6.018, "args": { "External id": 18854,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785679.484, "dur": 3.286, "args": { "External id": 18855,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650785684.877, "dur": 4.186, "args": { "External id": 18856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785686.638, "dur": 2.201, "args": { "External id": 18857,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650785690.736, "dur": 4.294, "args": { "External id": 18858,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785693.075, "dur": 1.736, "args": { "External id": 18859,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1450 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650785717.077, "dur": 168.992, "args": { "External id": 18860,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650785793.004, "dur": 4.067, "args": { "External id": 18861,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650785799.160, "dur": 3.187, "args": { "External id": 18862,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650785897.805, "dur": 3.634, "args": { "External id": 18863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650785904.367, "dur": 0.698, "args": { "External id": 18864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1381170, "ts": 1295650785906.759, "dur": 0.682, "args": { "External id": 18865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1456 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650785932.379, "dur": 276.525, "args": { "External id": 18866,"Record function id": 0, "Sequence number": 246614, "Fwd thread id": 1, "Ev Idx": 1457 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650785934.617, "dur": 266.383, "args": { "External id": 18867,"Sequence number": 246614, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1458 } }, { "ph": "f", "id": 154, "pid": 1336757, "tid": 1381170, "ts": 1295650785934.617, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650785951.627, "dur": 95.701, "args": { "External id": 18868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650785954.458, "dur": 2.487, "args": { "External id": 18869,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650785958.110, "dur": 88.213, "args": { "External id": 18870,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650786059.233, "dur": 6.385, "args": { "External id": 18871,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786061.649, "dur": 3.649, "args": { "External id": 18872,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1463 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650786218.246, "dur": 181.673, "args": { "External id": 18873,"Record function id": 0, "Sequence number": 246613, "Fwd thread id": 1, "Ev Idx": 1464 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650786220.490, "dur": 171.445, "args": { "External id": 18874,"Sequence number": 246613, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1465 } }, { "ph": "f", "id": 155, "pid": 1336757, "tid": 1381170, "ts": 1295650786220.490, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1381170, "ts": 1295650786249.407, "dur": 38.811, "args": { "External id": 18875,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786252.193, "dur": 3.951, "args": { "External id": 18876,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650786257.250, "dur": 30.449, "args": { "External id": 18877,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1381170, "ts": 1295650786295.565, "dur": 5.139, "args": { "External id": 18878,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786297.575, "dur": 2.783, "args": { "External id": 18879,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1470 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786407.935, "dur": 14.138, "args": { "External id": 18880,"Record function id": 0, "Sequence number": 246612, "Fwd thread id": 1, "Ev Idx": 1471 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786409.349, "dur": 10.244, "args": { "External id": 18881,"Sequence number": 246612, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1472 } }, { "ph": "f", "id": 156, "pid": 1336757, "tid": 1381170, "ts": 1295650786409.349, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786411.872, "dur": 7.417, "args": { "External id": 18882,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786413.456, "dur": 5.636, "args": { "External id": 18883,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1474 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786425.531, "dur": 6.147, "args": { "External id": 18884,"Record function id": 0, "Sequence number": 246611, "Fwd thread id": 1, "Ev Idx": 1475 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786426.306, "dur": 3.900, "args": { "External id": 18885,"Sequence number": 246611, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1476 } }, { "ph": "f", "id": 157, "pid": 1336757, "tid": 1381170, "ts": 1295650786426.306, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786427.769, "dur": 2.282, "args": { "External id": 18886,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786428.936, "dur": 0.972, "args": { "External id": 18887,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1478 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786435.001, "dur": 7.696, "args": { "External id": 18888,"Record function id": 0, "Sequence number": 246610, "Fwd thread id": 1, "Ev Idx": 1479 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786435.675, "dur": 5.349, "args": { "External id": 18889,"Sequence number": 246610, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1480 } }, { "ph": "f", "id": 158, "pid": 1336757, "tid": 1381170, "ts": 1295650786435.675, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786439.126, "dur": 1.759, "args": { "External id": 18890,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786439.918, "dur": 0.876, "args": { "External id": 18891,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1482 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786446.253, "dur": 6.413, "args": { "External id": 18892,"Record function id": 0, "Sequence number": 246609, "Fwd thread id": 1, "Ev Idx": 1483 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786447.548, "dur": 3.171, "args": { "External id": 18893,"Sequence number": 246609, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1484 } }, { "ph": "f", "id": 159, "pid": 1336757, "tid": 1381170, "ts": 1295650786447.548, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786448.735, "dur": 1.844, "args": { "External id": 18894,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786449.703, "dur": 0.792, "args": { "External id": 18895,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786455.694, "dur": 144.608, "args": { "External id": 18896,"Record function id": 0, "Sequence number": 246608, "Fwd thread id": 1, "Ev Idx": 1487 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786456.555, "dur": 137.000, "args": { "External id": 18897,"Sequence number": 246608, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1488 } }, { "ph": "f", "id": 160, "pid": 1336757, "tid": 1381170, "ts": 1295650786456.555, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786460.118, "dur": 9.146, "args": { "External id": 18898,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786464.092, "dur": 4.514, "args": { "External id": 18899,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786466.757, "dur": 1.527, "args": { "External id": 18900,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650786470.875, "dur": 65.061, "args": { "External id": 18901,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786537.218, "dur": 5.024, "args": { "External id": 18902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786538.005, "dur": 3.568, "args": { "External id": 18903,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786540.315, "dur": 1.080, "args": { "External id": 18904,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786543.845, "dur": 6.068, "args": { "External id": 18905,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786547.315, "dur": 2.137, "args": { "External id": 18906,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786548.991, "dur": 0.393, "args": { "External id": 18907,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650786550.694, "dur": 42.008, "args": { "External id": 18908,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1499 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786604.855, "dur": 7.007, "args": { "External id": 18909,"Record function id": 0, "Sequence number": 246607, "Fwd thread id": 1, "Ev Idx": 1500 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786605.759, "dur": 4.144, "args": { "External id": 18910,"Sequence number": 246607, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1501 } }, { "ph": "f", "id": 161, "pid": 1336757, "tid": 1381170, "ts": 1295650786605.759, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786607.506, "dur": 2.267, "args": { "External id": 18911,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786608.610, "dur": 1.058, "args": { "External id": 18912,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1503 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786615.166, "dur": 9.235, "args": { "External id": 18913,"Record function id": 0, "Sequence number": 246606, "Fwd thread id": 1, "Ev Idx": 1504 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786616.159, "dur": 6.255, "args": { "External id": 18914,"Sequence number": 246606, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1505 } }, { "ph": "f", "id": 162, "pid": 1336757, "tid": 1381170, "ts": 1295650786616.159, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786619.034, "dur": 3.162, "args": { "External id": 18915,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786619.560, "dur": 2.157, "args": { "External id": 18916,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786621.304, "dur": 0.313, "args": { "External id": 18917,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1508 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650786630.327, "dur": 9.223, "args": { "External id": 18918,"Record function id": 0, "Ev Idx": 1509 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650786632.010, "dur": 6.811, "args": { "External id": 18919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650786634.344, "dur": 4.105, "args": { "External id": 18920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1511 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650786635.657, "dur": 2.696, "args": { "External id": 18921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1512 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786643.105, "dur": 8.521, "args": { "External id": 18922,"Record function id": 0, "Sequence number": 246605, "Fwd thread id": 1, "Ev Idx": 1513 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786644.532, "dur": 5.606, "args": { "External id": 18923,"Sequence number": 246605, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1514 } }, { "ph": "f", "id": 163, "pid": 1336757, "tid": 1381170, "ts": 1295650786644.532, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786645.852, "dur": 4.143, "args": { "External id": 18924,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786649.022, "dur": 0.888, "args": { "External id": 18925,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1516 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786654.822, "dur": 86.497, "args": { "External id": 18926,"Record function id": 0, "Sequence number": 246604, "Fwd thread id": 1, "Ev Idx": 1517 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786655.899, "dur": 81.184, "args": { "External id": 18927,"Sequence number": 246604, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1518 } }, { "ph": "f", "id": 164, "pid": 1336757, "tid": 1381170, "ts": 1295650786655.899, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786657.567, "dur": 3.391, "args": { "External id": 18928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786658.257, "dur": 2.255, "args": { "External id": 18929,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786659.846, "dur": 0.542, "args": { "External id": 18930,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650786661.888, "dur": 26.583, "args": { "External id": 18931,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786692.069, "dur": 4.042, "args": { "External id": 18932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786692.642, "dur": 2.961, "args": { "External id": 18933,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786694.493, "dur": 0.983, "args": { "External id": 18934,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786697.231, "dur": 4.265, "args": { "External id": 18935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786697.923, "dur": 3.128, "args": { "External id": 18936,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786699.623, "dur": 1.301, "args": { "External id": 18937,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650786703.956, "dur": 32.329, "args": { "External id": 18938,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1529 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786747.782, "dur": 34.273, "args": { "External id": 18939,"Record function id": 0, "Sequence number": 246603, "Fwd thread id": 1, "Ev Idx": 1530 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786748.768, "dur": 6.631, "args": { "External id": 18940,"Sequence number": 246603, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1531 } }, { "ph": "f", "id": 165, "pid": 1336757, "tid": 1381170, "ts": 1295650786748.768, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786750.302, "dur": 4.946, "args": { "External id": 18941,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786754.046, "dur": 1.038, "args": { "External id": 18942,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1381170, "ts": 1295650786758.339, "dur": 21.387, "args": { "External id": 18943,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1534 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786785.813, "dur": 30.702, "args": { "External id": 18944,"Record function id": 0, "Sequence number": 246602, "Fwd thread id": 1, "Ev Idx": 1535 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786807.202, "dur": 7.355, "args": { "External id": 18945,"Sequence number": 246602, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1536 } }, { "ph": "f", "id": 166, "pid": 1336757, "tid": 1381170, "ts": 1295650786807.202, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786810.832, "dur": 3.528, "args": { "External id": 18946,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786811.388, "dur": 2.452, "args": { "External id": 18947,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786813.294, "dur": 0.421, "args": { "External id": 18948,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1539 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650786820.616, "dur": 4.857, "args": { "External id": 18949,"Record function id": 0, "Ev Idx": 1540 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650786822.408, "dur": 2.543, "args": { "External id": 18950,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650786823.307, "dur": 1.369, "args": { "External id": 18951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1542 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650786823.718, "dur": 0.866, "args": { "External id": 18952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1543 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786828.729, "dur": 8.921, "args": { "External id": 18953,"Record function id": 0, "Sequence number": 246601, "Fwd thread id": 1, "Ev Idx": 1544 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786830.226, "dur": 5.076, "args": { "External id": 18954,"Sequence number": 246601, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1545 } }, { "ph": "f", "id": 167, "pid": 1336757, "tid": 1381170, "ts": 1295650786830.226, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786831.275, "dur": 3.879, "args": { "External id": 18955,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786834.242, "dur": 0.826, "args": { "External id": 18956,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1547 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786840.846, "dur": 87.360, "args": { "External id": 18957,"Record function id": 0, "Sequence number": 246600, "Fwd thread id": 1, "Ev Idx": 1548 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786841.567, "dur": 80.088, "args": { "External id": 18958,"Sequence number": 246600, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1549 } }, { "ph": "f", "id": 168, "pid": 1336757, "tid": 1381170, "ts": 1295650786841.567, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786843.561, "dur": 2.752, "args": { "External id": 18959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786844.035, "dur": 1.842, "args": { "External id": 18960,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786845.366, "dur": 0.382, "args": { "External id": 18961,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650786846.972, "dur": 27.441, "args": { "External id": 18962,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786877.858, "dur": 2.979, "args": { "External id": 18963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786878.398, "dur": 1.845, "args": { "External id": 18964,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786879.679, "dur": 0.437, "args": { "External id": 18965,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786881.879, "dur": 2.874, "args": { "External id": 18966,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786882.649, "dur": 1.688, "args": { "External id": 18967,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786883.969, "dur": 0.294, "args": { "External id": 18968,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650786887.302, "dur": 33.725, "args": { "External id": 18969,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786932.703, "dur": 23.889, "args": { "External id": 18970,"Record function id": 0, "Sequence number": 246599, "Fwd thread id": 1, "Ev Idx": 1561 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786933.508, "dur": 3.748, "args": { "External id": 18971,"Sequence number": 246599, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1562 } }, { "ph": "f", "id": 169, "pid": 1336757, "tid": 1381170, "ts": 1295650786933.508, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650786934.870, "dur": 2.215, "args": { "External id": 18972,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650786935.705, "dur": 1.272, "args": { "External id": 18973,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650786939.375, "dur": 15.203, "args": { "External id": 18974,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1565 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786960.037, "dur": 8.925, "args": { "External id": 18975,"Record function id": 0, "Sequence number": 246598, "Fwd thread id": 1, "Ev Idx": 1566 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336757, "tid": 1381170, "ts": 1295650786960.856, "dur": 6.222, "args": { "External id": 18976,"Sequence number": 246598, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1567 } }, { "ph": "f", "id": 170, "pid": 1336757, "tid": 1381170, "ts": 1295650786960.856, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1381170, "ts": 1295650786961.522, "dur": 5.363, "args": { "External id": 18977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1381170, "ts": 1295650786962.261, "dur": 4.060, "args": { "External id": 18978,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650786965.749, "dur": 0.449, "args": { "External id": 18979,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1570 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650786972.939, "dur": 4.548, "args": { "External id": 18980,"Record function id": 0, "Ev Idx": 1571 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650786974.689, "dur": 2.326, "args": { "External id": 18981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650786975.482, "dur": 1.276, "args": { "External id": 18982,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1573 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650786975.821, "dur": 0.835, "args": { "External id": 18983,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1574 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650786981.847, "dur": 407.555, "args": { "External id": 18984,"Record function id": 0, "Sequence number": 246597, "Fwd thread id": 1, "Ev Idx": 1575 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650786983.407, "dur": 370.664, "args": { "External id": 18985,"Sequence number": 246597, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1576 } }, { "ph": "f", "id": 171, "pid": 1336757, "tid": 1381170, "ts": 1295650786983.407, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650787053.004, "dur": 3.244, "args": { "External id": 18986,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650787054.103, "dur": 1.854, "args": { "External id": 18987,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650787071.962, "dur": 5.733, "args": { "External id": 18988,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650787086.792, "dur": 2.268, "args": { "External id": 18989,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650787245.694, "dur": 2.996, "args": { "External id": 18990,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1381170, "ts": 1295650787253.590, "dur": 39.069, "args": { "External id": 18991,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787265.314, "dur": 1.140, "args": { "External id": 18992,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650787298.425, "dur": 32.270, "args": { "External id": 18993,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650787300.094, "dur": 30.399, "args": { "External id": 18994,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787304.477, "dur": 4.175, "args": { "External id": 18995,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650787312.549, "dur": 17.363, "args": { "External id": 18996,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1381170, "ts": 1295650787335.230, "dur": 2.681, "args": { "External id": 18997,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650787336.682, "dur": 1.118, "args": { "External id": 18998,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1381170, "ts": 1295650787344.369, "dur": 2.617, "args": { "External id": 18999,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650787345.671, "dur": 1.208, "args": { "External id": 19000,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1381170, "ts": 1295650787367.501, "dur": 17.025, "args": { "External id": 19001,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1592 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650787402.166, "dur": 11.949, "args": { "External id": 19002,"Record function id": 0, "Ev Idx": 1593 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650787404.901, "dur": 8.536, "args": { "External id": 19003,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650787406.939, "dur": 5.527, "args": { "External id": 19004,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1595 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650787410.164, "dur": 2.175, "args": { "External id": 19005,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1596 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650787418.393, "dur": 2637.395, "args": { "External id": 19006,"Record function id": 0, "Ev Idx": 1597 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.27)", "pid": 1336757, "tid": 1381170, "ts": 1295650787447.309, "dur": 895.429, "args": { "External id": 19007,"Record function id": 0, "Ev Idx": 1598 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.26", "pid": 1336757, "tid": 1381170, "ts": 1295650787469.806, "dur": 863.601, "args": { "External id": 19008,"Record function id": 0, "Ev Idx": 1599 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.26)", "pid": 1336757, "tid": 1381170, "ts": 1295650787484.749, "dur": 832.975, "args": { "External id": 19009,"Record function id": 0, "Ev Idx": 1600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650787556.208, "dur": 4.652, "args": { "External id": 19010,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295650787576.236, "dur": 30.610, "args": { "External id": 19011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787580.609, "dur": 1.085, "args": { "External id": 19012,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787583.866, "dur": 1.997, "args": { "External id": 19013,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787587.637, "dur": 0.346, "args": { "External id": 19014,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787589.972, "dur": 0.437, "args": { "External id": 19015,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787592.086, "dur": 0.356, "args": { "External id": 19016,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787594.479, "dur": 0.468, "args": { "External id": 19017,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787596.765, "dur": 0.320, "args": { "External id": 19018,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787599.125, "dur": 0.333, "args": { "External id": 19019,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787601.600, "dur": 0.340, "args": { "External id": 19020,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650787621.618, "dur": 30.124, "args": { "External id": 19021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1612 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295650787687.552, "dur": 105.760, "args": { "External id": 19022,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650787698.783, "dur": 4.833, "args": { "External id": 19023,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295650787708.792, "dur": 10.385, "args": { "External id": 19024,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650787712.736, "dur": 6.029, "args": { "External id": 19025,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787716.676, "dur": 0.650, "args": { "External id": 19026,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295650787726.450, "dur": 26.813, "args": { "External id": 19027,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787729.184, "dur": 0.332, "args": { "External id": 19028,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787731.499, "dur": 0.485, "args": { "External id": 19029,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787733.871, "dur": 0.373, "args": { "External id": 19030,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787735.923, "dur": 0.381, "args": { "External id": 19031,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787737.890, "dur": 0.403, "args": { "External id": 19032,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787740.164, "dur": 0.441, "args": { "External id": 19033,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787742.400, "dur": 1.319, "args": { "External id": 19034,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787745.409, "dur": 0.401, "args": { "External id": 19035,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650787747.466, "dur": 0.443, "args": { "External id": 19036,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650787763.682, "dur": 21.800, "args": { "External id": 19037,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1628 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295650787845.993, "dur": 353.105, "args": { "External id": 19038,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1629 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650787870.681, "dur": 323.041, "args": { "External id": 19039,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1630, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295650787880.881, "dur": 306.711, "args": { "External id": 19040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1631 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650788221.063, "dur": 2.348, "args": { "External id": 19041,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1632, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650788351.137, "dur": 1683.209, "args": { "External id": 19042,"Sequence number": 246596, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1633 } }, { "ph": "f", "id": 172, "pid": 1336757, "tid": 1381170, "ts": 1295650788351.137, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650788470.397, "dur": 108.573, "args": { "External id": 19043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1634 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295650788617.688, "dur": 41.609, "args": { "External id": 19044,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295650788680.602, "dur": 52.118, "args": { "External id": 19045,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650788742.567, "dur": 34.125, "args": { "External id": 19046,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650788784.098, "dur": 47.163, "args": { "External id": 19047,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650788839.980, "dur": 29.273, "args": { "External id": 19048,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650788876.408, "dur": 43.665, "args": { "External id": 19049,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1640 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295650788943.759, "dur": 23.568, "args": { "External id": 19050,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1641 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295650789027.725, "dur": 33.910, "args": { "External id": 19051,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1642 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295650789086.274, "dur": 23.030, "args": { "External id": 19052,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1643 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295650789124.937, "dur": 17.847, "args": { "External id": 19053,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789154.555, "dur": 35.105, "args": { "External id": 19054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789192.714, "dur": 48.899, "args": { "External id": 19055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1646 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650789273.848, "dur": 177.792, "args": { "External id": 19056,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650789356.630, "dur": 5.682, "args": { "External id": 19057,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650789364.472, "dur": 3.308, "args": { "External id": 19058,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1649 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295650789484.096, "dur": 27.754, "args": { "External id": 19059,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1650 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295650789525.253, "dur": 16.146, "args": { "External id": 19060,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789550.599, "dur": 41.676, "args": { "External id": 19061,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789599.856, "dur": 37.662, "args": { "External id": 19062,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789645.076, "dur": 22.987, "args": { "External id": 19063,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789674.587, "dur": 31.422, "args": { "External id": 19064,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789712.418, "dur": 22.264, "args": { "External id": 19065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650789742.324, "dur": 31.684, "args": { "External id": 19066,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1657 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295650789792.113, "dur": 25.090, "args": { "External id": 19067,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1658 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295650789835.139, "dur": 26.542, "args": { "External id": 19068,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1659 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295650789877.410, "dur": 18.251, "args": { "External id": 19069,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1660 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295650789908.571, "dur": 16.028, "args": { "External id": 19070,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1661 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295650789940.390, "dur": 16.609, "args": { "External id": 19071,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1662 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790078.235, "dur": 15.944, "args": { "External id": 19072,"Record function id": 0, "Ev Idx": 1663 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790082.148, "dur": 11.158, "args": { "External id": 19073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790086.337, "dur": 6.077, "args": { "External id": 19074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1665 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790088.182, "dur": 4.079, "args": { "External id": 19075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1666 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790098.260, "dur": 5.577, "args": { "External id": 19076,"Record function id": 0, "Ev Idx": 1667 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790100.102, "dur": 3.227, "args": { "External id": 19077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790100.883, "dur": 1.934, "args": { "External id": 19078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1669 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790101.688, "dur": 1.025, "args": { "External id": 19079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1670 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790107.166, "dur": 5.507, "args": { "External id": 19080,"Record function id": 0, "Ev Idx": 1671 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790109.071, "dur": 3.172, "args": { "External id": 19081,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790110.012, "dur": 1.781, "args": { "External id": 19082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1673 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790110.711, "dur": 0.995, "args": { "External id": 19083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1674 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790116.233, "dur": 5.360, "args": { "External id": 19084,"Record function id": 0, "Ev Idx": 1675 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790118.116, "dur": 3.067, "args": { "External id": 19085,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790118.580, "dur": 2.209, "args": { "External id": 19086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1677 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790118.866, "dur": 1.836, "args": { "External id": 19087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1678 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790124.930, "dur": 3.699, "args": { "External id": 19088,"Record function id": 0, "Ev Idx": 1679 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790126.227, "dur": 1.966, "args": { "External id": 19089,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790126.677, "dur": 1.096, "args": { "External id": 19090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1681 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790127.142, "dur": 0.540, "args": { "External id": 19091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1682 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790131.895, "dur": 4.569, "args": { "External id": 19092,"Record function id": 0, "Ev Idx": 1683 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790133.349, "dur": 2.669, "args": { "External id": 19093,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790133.791, "dur": 1.820, "args": { "External id": 19094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1685 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790134.725, "dur": 0.803, "args": { "External id": 19095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1686 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790139.908, "dur": 4.480, "args": { "External id": 19096,"Record function id": 0, "Ev Idx": 1687 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790141.877, "dur": 2.084, "args": { "External id": 19097,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790142.564, "dur": 1.006, "args": { "External id": 19098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1689 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790143.031, "dur": 0.458, "args": { "External id": 19099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1690 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790147.787, "dur": 4.404, "args": { "External id": 19100,"Record function id": 0, "Ev Idx": 1691 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790149.650, "dur": 2.094, "args": { "External id": 19101,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790150.093, "dur": 1.161, "args": { "External id": 19102,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1693 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790150.581, "dur": 0.569, "args": { "External id": 19103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1694 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790155.456, "dur": 4.057, "args": { "External id": 19104,"Record function id": 0, "Ev Idx": 1695 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650790156.691, "dur": 2.399, "args": { "External id": 19105,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790157.314, "dur": 1.353, "args": { "External id": 19106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1697 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650790157.954, "dur": 0.605, "args": { "External id": 19107,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1698 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650790164.200, "dur": 161598.343, "args": { "External id": 19108,"Record function id": 0, "Sequence number": 246595, "Fwd thread id": 1, "Ev Idx": 1699 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650790165.845, "dur": 161588.172, "args": { "External id": 19109,"Sequence number": 246595, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1700 } }, { "ph": "f", "id": 173, "pid": 1336757, "tid": 1381170, "ts": 1295650790165.845, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.27)", "pid": 1336757, "tid": 1381170, "ts": 1295650790196.450, "dur": 53.565, "args": { "External id": 19110,"Record function id": 0, "Ev Idx": 1701 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.27)", "pid": 1336757, "tid": 1381170, "ts": 1295650790259.848, "dur": 71.410, "args": { "External id": 19111,"Record function id": 0, "Ev Idx": 1702 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.27)", "pid": 1336757, "tid": 1381170, "ts": 1295650790337.503, "dur": 161407.944, "args": { "External id": 19112,"Record function id": 0, "Ev Idx": 1703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650790393.700, "dur": 8.396, "args": { "External id": 19113,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650790412.619, "dur": 4.992, "args": { "External id": 19114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1705 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295650790434.179, "dur": 160422.666, "args": { "External id": 19115,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295650790449.904, "dur": 160396.283, "args": { "External id": 19116,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650790545.523, "dur": 5.014, "args": { "External id": 19117,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650790561.553, "dur": 160226.975, "args": { "External id": 19118,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 1709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650790564.303, "dur": 160223.187, "args": { "External id": 19119,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 1710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650790568.291, "dur": 4.745, "args": { "External id": 19120,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650790574.806, "dur": 160207.346, "args": { "External id": 19121,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 1712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295650950962.380, "dur": 12.531, "args": { "External id": 19122,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 1713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650950966.360, "dur": 8.215, "args": { "External id": 19123,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1714 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295650951044.901, "dur": 356.234, "args": { "External id": 19124,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 1715 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650951073.286, "dur": 322.855, "args": { "External id": 19125,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1716, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295650951086.308, "dur": 303.687, "args": { "External id": 19126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 1717 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650951422.237, "dur": 2.393, "args": { "External id": 19127,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1718, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951498.063, "dur": 7.942, "args": { "External id": 19128,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951564.748, "dur": 1.735, "args": { "External id": 19129,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951585.371, "dur": 1.282, "args": { "External id": 19130,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951601.415, "dur": 0.849, "args": { "External id": 19131,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951616.063, "dur": 0.997, "args": { "External id": 19132,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951628.726, "dur": 1.102, "args": { "External id": 19133,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951642.665, "dur": 1.272, "args": { "External id": 19134,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951665.146, "dur": 2.489, "args": { "External id": 19135,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650951680.161, "dur": 1.082, "args": { "External id": 19136,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1727 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650951785.145, "dur": 2845.392, "args": { "External id": 19137,"Record function id": 0, "Ev Idx": 1728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.26)", "pid": 1336757, "tid": 1381170, "ts": 1295650951804.237, "dur": 1070.634, "args": { "External id": 19138,"Record function id": 0, "Ev Idx": 1729 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.26)", "pid": 1336757, "tid": 1381170, "ts": 1295650951819.196, "dur": 376.451, "args": { "External id": 19139,"Record function id": 0, "Ev Idx": 1730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951895.284, "dur": 3.948, "args": { "External id": 19140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951902.609, "dur": 0.983, "args": { "External id": 19141,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951905.518, "dur": 1.107, "args": { "External id": 19142,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951908.174, "dur": 2.409, "args": { "External id": 19143,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951912.108, "dur": 1.001, "args": { "External id": 19144,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951914.735, "dur": 0.820, "args": { "External id": 19145,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951917.198, "dur": 2.188, "args": { "External id": 19146,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951920.998, "dur": 0.953, "args": { "External id": 19147,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951923.549, "dur": 0.924, "args": { "External id": 19148,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650951925.941, "dur": 0.835, "args": { "External id": 19149,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1740 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650951945.503, "dur": 206.504, "args": { "External id": 19150,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650951962.281, "dur": 184.357, "args": { "External id": 19151,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650952027.199, "dur": 13.752, "args": { "External id": 19152,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650952044.611, "dur": 69.793, "args": { "External id": 19153,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 1744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650952047.121, "dur": 66.965, "args": { "External id": 19154,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 1745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952051.357, "dur": 8.522, "args": { "External id": 19155,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650952062.088, "dur": 51.426, "args": { "External id": 19156,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 1747 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.25", "pid": 1336757, "tid": 1381170, "ts": 1295650952300.128, "dur": 566.406, "args": { "External id": 19157,"Record function id": 0, "Ev Idx": 1748 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.25)", "pid": 1336757, "tid": 1381170, "ts": 1295650952319.002, "dur": 534.930, "args": { "External id": 19158,"Record function id": 0, "Ev Idx": 1749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650952379.872, "dur": 6.063, "args": { "External id": 19159,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295650952402.178, "dur": 31.518, "args": { "External id": 19160,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952407.518, "dur": 1.766, "args": { "External id": 19161,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952411.856, "dur": 0.739, "args": { "External id": 19162,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952414.212, "dur": 0.398, "args": { "External id": 19163,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952416.141, "dur": 0.522, "args": { "External id": 19164,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952418.395, "dur": 0.394, "args": { "External id": 19165,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952420.501, "dur": 0.407, "args": { "External id": 19166,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952422.453, "dur": 1.422, "args": { "External id": 19167,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952425.832, "dur": 0.431, "args": { "External id": 19168,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952428.309, "dur": 0.385, "args": { "External id": 19169,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650952449.588, "dur": 35.649, "args": { "External id": 19170,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1761 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295650952520.833, "dur": 105.329, "args": { "External id": 19171,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650952531.417, "dur": 3.095, "args": { "External id": 19172,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295650952539.836, "dur": 10.821, "args": { "External id": 19173,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650952544.461, "dur": 5.788, "args": { "External id": 19174,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952548.578, "dur": 0.424, "args": { "External id": 19175,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295650952558.393, "dur": 25.915, "args": { "External id": 19176,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952561.012, "dur": 0.388, "args": { "External id": 19177,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952563.372, "dur": 0.484, "args": { "External id": 19178,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952565.484, "dur": 0.385, "args": { "External id": 19179,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952568.004, "dur": 1.299, "args": { "External id": 19180,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952571.261, "dur": 0.447, "args": { "External id": 19181,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952573.608, "dur": 0.335, "args": { "External id": 19182,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952575.580, "dur": 0.328, "args": { "External id": 19183,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952577.448, "dur": 0.405, "args": { "External id": 19184,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650952579.519, "dur": 0.473, "args": { "External id": 19185,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650952596.607, "dur": 20.705, "args": { "External id": 19186,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1777 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295650952674.936, "dur": 113.124, "args": { "External id": 19187,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1778 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650952697.452, "dur": 86.957, "args": { "External id": 19188,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1779, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295650952710.847, "dur": 69.470, "args": { "External id": 19189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1780 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650952802.976, "dur": 1.840, "args": { "External id": 19190,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1781, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650952881.915, "dur": 1727.407, "args": { "External id": 19191,"Sequence number": 246594, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1782 } }, { "ph": "f", "id": 174, "pid": 1336757, "tid": 1381170, "ts": 1295650952881.915, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650953042.632, "dur": 104.827, "args": { "External id": 19192,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1783 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295650953190.106, "dur": 54.088, "args": { "External id": 19193,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295650953265.113, "dur": 54.740, "args": { "External id": 19194,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650953330.292, "dur": 34.802, "args": { "External id": 19195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650953373.565, "dur": 47.273, "args": { "External id": 19196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650953429.220, "dur": 29.633, "args": { "External id": 19197,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650953466.244, "dur": 42.537, "args": { "External id": 19198,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1789 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295650953532.554, "dur": 23.031, "args": { "External id": 19199,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1790 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295650953576.671, "dur": 28.039, "args": { "External id": 19200,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1791 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295650953626.790, "dur": 21.694, "args": { "External id": 19201,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1792 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295650953662.716, "dur": 16.449, "args": { "External id": 19202,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650953688.545, "dur": 29.957, "args": { "External id": 19203,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650953722.227, "dur": 34.081, "args": { "External id": 19204,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1795 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650953785.044, "dur": 171.332, "args": { "External id": 19205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650953865.252, "dur": 5.425, "args": { "External id": 19206,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650953872.797, "dur": 2.315, "args": { "External id": 19207,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1798 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295650954035.231, "dur": 31.009, "args": { "External id": 19208,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1799 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295650954081.746, "dur": 16.397, "args": { "External id": 19209,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650954109.968, "dur": 46.542, "args": { "External id": 19210,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650954164.453, "dur": 52.072, "args": { "External id": 19211,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650954247.467, "dur": 34.471, "args": { "External id": 19212,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650954288.807, "dur": 33.962, "args": { "External id": 19213,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650954329.247, "dur": 21.743, "args": { "External id": 19214,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650954359.175, "dur": 29.937, "args": { "External id": 19215,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1806 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295650954409.691, "dur": 26.906, "args": { "External id": 19216,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1807 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295650954456.805, "dur": 24.701, "args": { "External id": 19217,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1808 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295650954497.790, "dur": 21.673, "args": { "External id": 19218,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1809 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295650954532.972, "dur": 15.062, "args": { "External id": 19219,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1810 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295650954564.152, "dur": 16.200, "args": { "External id": 19220,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1811 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954652.653, "dur": 14.597, "args": { "External id": 19221,"Record function id": 0, "Ev Idx": 1812 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954655.626, "dur": 10.759, "args": { "External id": 19222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954659.402, "dur": 6.121, "args": { "External id": 19223,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1814 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954661.257, "dur": 4.133, "args": { "External id": 19224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1815 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954671.102, "dur": 5.661, "args": { "External id": 19225,"Record function id": 0, "Ev Idx": 1816 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954673.098, "dur": 3.118, "args": { "External id": 19226,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954673.900, "dur": 1.823, "args": { "External id": 19227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1818 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954674.635, "dur": 1.015, "args": { "External id": 19228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1819 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954680.122, "dur": 4.812, "args": { "External id": 19229,"Record function id": 0, "Ev Idx": 1820 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954681.634, "dur": 2.863, "args": { "External id": 19230,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954682.263, "dur": 1.812, "args": { "External id": 19231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1822 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954682.843, "dur": 1.144, "args": { "External id": 19232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1823 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954688.244, "dur": 5.251, "args": { "External id": 19233,"Record function id": 0, "Ev Idx": 1824 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954689.584, "dur": 3.476, "args": { "External id": 19234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954690.148, "dur": 2.493, "args": { "External id": 19235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1826 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954690.452, "dur": 2.116, "args": { "External id": 19236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1827 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954696.746, "dur": 4.008, "args": { "External id": 19237,"Record function id": 0, "Ev Idx": 1828 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954697.779, "dur": 2.566, "args": { "External id": 19238,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954698.366, "dur": 1.591, "args": { "External id": 19239,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1830 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954698.820, "dur": 1.065, "args": { "External id": 19240,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1831 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954704.008, "dur": 4.500, "args": { "External id": 19241,"Record function id": 0, "Ev Idx": 1832 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954705.535, "dur": 2.582, "args": { "External id": 19242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954706.274, "dur": 1.327, "args": { "External id": 19243,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1834 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954706.766, "dur": 0.730, "args": { "External id": 19244,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1835 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954711.976, "dur": 4.289, "args": { "External id": 19245,"Record function id": 0, "Ev Idx": 1836 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954713.493, "dur": 2.358, "args": { "External id": 19246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954713.982, "dur": 1.451, "args": { "External id": 19247,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1838 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954714.493, "dur": 0.836, "args": { "External id": 19248,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1839 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954719.513, "dur": 3.355, "args": { "External id": 19249,"Record function id": 0, "Ev Idx": 1840 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954720.628, "dur": 1.843, "args": { "External id": 19250,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954721.106, "dur": 0.934, "args": { "External id": 19251,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1842 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954721.393, "dur": 0.569, "args": { "External id": 19252,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1843 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954725.916, "dur": 3.836, "args": { "External id": 19253,"Record function id": 0, "Ev Idx": 1844 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650954727.239, "dur": 2.120, "args": { "External id": 19254,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954727.695, "dur": 1.270, "args": { "External id": 19255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1846 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650954728.232, "dur": 0.637, "args": { "External id": 19256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1847 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650954733.392, "dur": 41741.539, "args": { "External id": 19257,"Record function id": 0, "Sequence number": 246593, "Fwd thread id": 1, "Ev Idx": 1848 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650954734.519, "dur": 41731.968, "args": { "External id": 19258,"Sequence number": 246593, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1849 } }, { "ph": "f", "id": 175, "pid": 1336757, "tid": 1381170, "ts": 1295650954734.519, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.26)", "pid": 1336757, "tid": 1381170, "ts": 1295650954761.865, "dur": 37.677, "args": { "External id": 19259,"Record function id": 0, "Ev Idx": 1850 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.26)", "pid": 1336757, "tid": 1381170, "ts": 1295650954807.141, "dur": 57.944, "args": { "External id": 19260,"Record function id": 0, "Ev Idx": 1851 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.26)", "pid": 1336757, "tid": 1381170, "ts": 1295650954870.883, "dur": 41588.165, "args": { "External id": 19261,"Record function id": 0, "Ev Idx": 1852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650954955.859, "dur": 6.490, "args": { "External id": 19262,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650954971.989, "dur": 4.583, "args": { "External id": 19263,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1854 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295650955041.551, "dur": 40544.723, "args": { "External id": 19264,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295650955056.287, "dur": 40520.833, "args": { "External id": 19265,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650955125.965, "dur": 15.669, "args": { "External id": 19266,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650955150.504, "dur": 40386.403, "args": { "External id": 19267,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 1858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650955152.999, "dur": 40383.225, "args": { "External id": 19268,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 1859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650955157.317, "dur": 5.645, "args": { "External id": 19269,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650955165.055, "dur": 40367.708, "args": { "External id": 19270,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 1861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295650995674.070, "dur": 8.890, "args": { "External id": 19271,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 1862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650995677.200, "dur": 5.449, "args": { "External id": 19272,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1863 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295650995713.465, "dur": 415.099, "args": { "External id": 19273,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 1864 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650995740.487, "dur": 382.188, "args": { "External id": 19274,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1865, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295650995752.121, "dur": 363.995, "args": { "External id": 19275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 1866 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650996150.387, "dur": 2.266, "args": { "External id": 19276,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1867, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996217.135, "dur": 6.705, "args": { "External id": 19277,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996288.768, "dur": 2.067, "args": { "External id": 19278,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996309.628, "dur": 0.909, "args": { "External id": 19279,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996325.814, "dur": 0.774, "args": { "External id": 19280,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996341.964, "dur": 0.882, "args": { "External id": 19281,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996354.431, "dur": 1.124, "args": { "External id": 19282,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996367.749, "dur": 1.144, "args": { "External id": 19283,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996382.612, "dur": 2.188, "args": { "External id": 19284,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996396.276, "dur": 0.941, "args": { "External id": 19285,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1876 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650996490.498, "dur": 2727.541, "args": { "External id": 19286,"Record function id": 0, "Ev Idx": 1877 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.25)", "pid": 1336757, "tid": 1381170, "ts": 1295650996508.686, "dur": 1035.965, "args": { "External id": 19287,"Record function id": 0, "Ev Idx": 1878 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.25)", "pid": 1336757, "tid": 1381170, "ts": 1295650996523.353, "dur": 311.896, "args": { "External id": 19288,"Record function id": 0, "Ev Idx": 1879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996596.494, "dur": 4.132, "args": { "External id": 19289,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996604.051, "dur": 1.033, "args": { "External id": 19290,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996607.099, "dur": 0.850, "args": { "External id": 19291,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996609.801, "dur": 1.917, "args": { "External id": 19292,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996613.368, "dur": 0.894, "args": { "External id": 19293,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996616.083, "dur": 0.762, "args": { "External id": 19294,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996618.732, "dur": 1.860, "args": { "External id": 19295,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996621.965, "dur": 1.184, "args": { "External id": 19296,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996624.623, "dur": 0.727, "args": { "External id": 19297,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650996626.775, "dur": 0.925, "args": { "External id": 19298,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1889 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650996646.148, "dur": 155.699, "args": { "External id": 19299,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650996662.312, "dur": 135.055, "args": { "External id": 19300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650996685.855, "dur": 11.761, "args": { "External id": 19301,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650996700.954, "dur": 68.927, "args": { "External id": 19302,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 1893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650996703.383, "dur": 66.149, "args": { "External id": 19303,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 1894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650996707.734, "dur": 8.474, "args": { "External id": 19304,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650996718.099, "dur": 50.692, "args": { "External id": 19305,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 1896 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.24", "pid": 1336757, "tid": 1381170, "ts": 1295650996911.942, "dur": 624.297, "args": { "External id": 19306,"Record function id": 0, "Ev Idx": 1897 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.24)", "pid": 1336757, "tid": 1381170, "ts": 1295650996929.313, "dur": 593.659, "args": { "External id": 19307,"Record function id": 0, "Ev Idx": 1898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650997033.746, "dur": 7.003, "args": { "External id": 19308,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295650997058.348, "dur": 32.327, "args": { "External id": 19309,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997063.718, "dur": 2.169, "args": { "External id": 19310,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997068.287, "dur": 0.398, "args": { "External id": 19311,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997070.578, "dur": 0.353, "args": { "External id": 19312,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997073.013, "dur": 0.421, "args": { "External id": 19313,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997075.433, "dur": 0.347, "args": { "External id": 19314,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997077.601, "dur": 0.679, "args": { "External id": 19315,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997079.901, "dur": 1.435, "args": { "External id": 19316,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997082.789, "dur": 0.351, "args": { "External id": 19317,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997085.075, "dur": 0.364, "args": { "External id": 19318,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650997100.958, "dur": 33.720, "args": { "External id": 19319,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1910 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295650997168.296, "dur": 128.208, "args": { "External id": 19320,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650997179.509, "dur": 3.250, "args": { "External id": 19321,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295650997187.865, "dur": 10.294, "args": { "External id": 19322,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295650997192.019, "dur": 5.759, "args": { "External id": 19323,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997196.008, "dur": 0.562, "args": { "External id": 19324,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295650997205.074, "dur": 48.494, "args": { "External id": 19325,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997207.337, "dur": 0.447, "args": { "External id": 19326,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997209.535, "dur": 0.405, "args": { "External id": 19327,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997220.371, "dur": 0.503, "args": { "External id": 19328,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997222.986, "dur": 1.163, "args": { "External id": 19329,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997225.705, "dur": 0.312, "args": { "External id": 19330,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997227.431, "dur": 13.919, "args": { "External id": 19331,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997244.401, "dur": 0.583, "args": { "External id": 19332,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997246.762, "dur": 0.334, "args": { "External id": 19333,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650997248.557, "dur": 0.372, "args": { "External id": 19334,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650997265.547, "dur": 21.954, "args": { "External id": 19335,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1926 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295650997346.751, "dur": 107.792, "args": { "External id": 19336,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1927 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650997368.670, "dur": 82.060, "args": { "External id": 19337,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1928, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295650997378.942, "dur": 67.802, "args": { "External id": 19338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1929 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295650997470.556, "dur": 1.876, "args": { "External id": 19339,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1930, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650997552.116, "dur": 1643.228, "args": { "External id": 19340,"Sequence number": 246592, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1931 } }, { "ph": "f", "id": 176, "pid": 1336757, "tid": 1381170, "ts": 1295650997552.116, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650997656.633, "dur": 99.110, "args": { "External id": 19341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1932 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295650997793.394, "dur": 39.809, "args": { "External id": 19342,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295650997850.407, "dur": 49.571, "args": { "External id": 19343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650997909.393, "dur": 34.651, "args": { "External id": 19344,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650997952.369, "dur": 84.357, "args": { "External id": 19345,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998048.339, "dur": 34.691, "args": { "External id": 19346,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998098.440, "dur": 43.266, "args": { "External id": 19347,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1938 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295650998169.204, "dur": 23.462, "args": { "External id": 19348,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1939 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295650998211.889, "dur": 43.804, "args": { "External id": 19349,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1940 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295650998280.638, "dur": 22.274, "args": { "External id": 19350,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1941 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295650998321.218, "dur": 15.306, "args": { "External id": 19351,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998346.165, "dur": 35.074, "args": { "External id": 19352,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998384.597, "dur": 34.151, "args": { "External id": 19353,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1944 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295650998445.151, "dur": 175.943, "args": { "External id": 19354,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650998529.340, "dur": 6.409, "args": { "External id": 19355,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650998538.237, "dur": 2.128, "args": { "External id": 19356,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1947 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295650998650.858, "dur": 25.360, "args": { "External id": 19357,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1948 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295650998687.151, "dur": 15.499, "args": { "External id": 19358,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998710.281, "dur": 35.474, "args": { "External id": 19359,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998752.279, "dur": 35.141, "args": { "External id": 19360,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998795.429, "dur": 22.610, "args": { "External id": 19361,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998823.526, "dur": 31.249, "args": { "External id": 19362,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998861.094, "dur": 20.687, "args": { "External id": 19363,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295650998889.147, "dur": 42.179, "args": { "External id": 19364,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1955 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295650998954.560, "dur": 25.025, "args": { "External id": 19365,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1956 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295650999035.517, "dur": 27.921, "args": { "External id": 19366,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1957 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295650999081.046, "dur": 22.064, "args": { "External id": 19367,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1958 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295650999118.737, "dur": 16.766, "args": { "External id": 19368,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1959 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295650999149.792, "dur": 17.261, "args": { "External id": 19369,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1960 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999254.608, "dur": 17.766, "args": { "External id": 19370,"Record function id": 0, "Ev Idx": 1961 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999258.732, "dur": 12.419, "args": { "External id": 19371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999263.086, "dur": 6.730, "args": { "External id": 19372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1963 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999264.807, "dur": 4.735, "args": { "External id": 19373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1964 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999276.553, "dur": 5.045, "args": { "External id": 19374,"Record function id": 0, "Ev Idx": 1965 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999278.158, "dur": 2.970, "args": { "External id": 19375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999278.795, "dur": 1.856, "args": { "External id": 19376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1967 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999279.583, "dur": 0.944, "args": { "External id": 19377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1968 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999284.819, "dur": 4.392, "args": { "External id": 19378,"Record function id": 0, "Ev Idx": 1969 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999286.207, "dur": 2.575, "args": { "External id": 19379,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999286.676, "dur": 1.604, "args": { "External id": 19380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1971 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999287.255, "dur": 0.952, "args": { "External id": 19381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1972 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999292.320, "dur": 5.642, "args": { "External id": 19382,"Record function id": 0, "Ev Idx": 1973 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999293.700, "dur": 3.795, "args": { "External id": 19383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999294.337, "dur": 2.751, "args": { "External id": 19384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1975 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999295.174, "dur": 1.830, "args": { "External id": 19385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1976 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999301.060, "dur": 3.535, "args": { "External id": 19386,"Record function id": 0, "Ev Idx": 1977 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999302.130, "dur": 2.045, "args": { "External id": 19387,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999302.707, "dur": 1.055, "args": { "External id": 19388,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1979 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999302.982, "dur": 0.701, "args": { "External id": 19389,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1980 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999307.675, "dur": 4.510, "args": { "External id": 19390,"Record function id": 0, "Ev Idx": 1981 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999309.082, "dur": 2.655, "args": { "External id": 19391,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999309.857, "dur": 1.442, "args": { "External id": 19392,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1983 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999310.542, "dur": 0.644, "args": { "External id": 19393,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1984 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999315.330, "dur": 3.701, "args": { "External id": 19394,"Record function id": 0, "Ev Idx": 1985 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999316.611, "dur": 2.000, "args": { "External id": 19395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999317.082, "dur": 1.095, "args": { "External id": 19396,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1987 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999317.490, "dur": 0.590, "args": { "External id": 19397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1988 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999322.119, "dur": 3.563, "args": { "External id": 19398,"Record function id": 0, "Ev Idx": 1989 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999323.412, "dur": 1.854, "args": { "External id": 19399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999323.848, "dur": 1.014, "args": { "External id": 19400,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1991 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999324.237, "dur": 0.560, "args": { "External id": 19401,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1992 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999328.655, "dur": 3.377, "args": { "External id": 19402,"Record function id": 0, "Ev Idx": 1993 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295650999329.651, "dur": 1.964, "args": { "External id": 19403,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999330.144, "dur": 1.045, "args": { "External id": 19404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1995 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295650999330.663, "dur": 0.415, "args": { "External id": 19405,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1996 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650999335.372, "dur": 38987.374, "args": { "External id": 19406,"Record function id": 0, "Sequence number": 246591, "Fwd thread id": 1, "Ev Idx": 1997 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295650999336.645, "dur": 38976.633, "args": { "External id": 19407,"Sequence number": 246591, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1998 } }, { "ph": "f", "id": 177, "pid": 1336757, "tid": 1381170, "ts": 1295650999336.645, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.25)", "pid": 1336757, "tid": 1381170, "ts": 1295650999366.423, "dur": 36.713, "args": { "External id": 19408,"Record function id": 0, "Ev Idx": 1999 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.25)", "pid": 1336757, "tid": 1381170, "ts": 1295650999410.519, "dur": 57.739, "args": { "External id": 19409,"Record function id": 0, "Ev Idx": 2000 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.25)", "pid": 1336757, "tid": 1381170, "ts": 1295650999474.066, "dur": 38830.499, "args": { "External id": 19410,"Record function id": 0, "Ev Idx": 2001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650999560.616, "dur": 6.805, "args": { "External id": 19411,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295650999576.655, "dur": 4.569, "args": { "External id": 19412,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2003 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295650999595.744, "dur": 37890.514, "args": { "External id": 19413,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295650999609.036, "dur": 37868.195, "args": { "External id": 19414,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295650999669.347, "dur": 14.412, "args": { "External id": 19415,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295650999690.858, "dur": 37744.224, "args": { "External id": 19416,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295650999693.340, "dur": 37741.061, "args": { "External id": 19417,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295650999697.841, "dur": 4.710, "args": { "External id": 19418,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295650999704.593, "dur": 37726.098, "args": { "External id": 19419,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651037573.267, "dur": 9.723, "args": { "External id": 19420,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651037576.829, "dur": 5.861, "args": { "External id": 19421,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2012 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651037612.846, "dur": 326.518, "args": { "External id": 19422,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2013 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651037638.149, "dur": 296.503, "args": { "External id": 19423,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2014, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651037649.017, "dur": 280.477, "args": { "External id": 19424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2015 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651037956.658, "dur": 2.210, "args": { "External id": 19425,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2016, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038064.473, "dur": 7.072, "args": { "External id": 19426,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038118.620, "dur": 1.408, "args": { "External id": 19427,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038138.074, "dur": 0.935, "args": { "External id": 19428,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038153.291, "dur": 1.046, "args": { "External id": 19429,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038169.796, "dur": 0.884, "args": { "External id": 19430,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038182.210, "dur": 1.190, "args": { "External id": 19431,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038196.300, "dur": 1.089, "args": { "External id": 19432,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038211.009, "dur": 2.961, "args": { "External id": 19433,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038225.166, "dur": 1.228, "args": { "External id": 19434,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2025 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651038338.766, "dur": 2737.907, "args": { "External id": 19435,"Record function id": 0, "Ev Idx": 2026 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.24)", "pid": 1336757, "tid": 1381170, "ts": 1295651038356.240, "dur": 1021.970, "args": { "External id": 19436,"Record function id": 0, "Ev Idx": 2027 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.24)", "pid": 1336757, "tid": 1381170, "ts": 1295651038369.894, "dur": 309.261, "args": { "External id": 19437,"Record function id": 0, "Ev Idx": 2028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038443.424, "dur": 4.256, "args": { "External id": 19438,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038450.608, "dur": 1.206, "args": { "External id": 19439,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038453.905, "dur": 1.073, "args": { "External id": 19440,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038456.542, "dur": 2.590, "args": { "External id": 19441,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038460.736, "dur": 1.065, "args": { "External id": 19442,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038463.470, "dur": 0.930, "args": { "External id": 19443,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038465.845, "dur": 2.182, "args": { "External id": 19444,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038469.711, "dur": 0.773, "args": { "External id": 19445,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038472.301, "dur": 1.023, "args": { "External id": 19446,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651038474.604, "dur": 0.901, "args": { "External id": 19447,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2038 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651038494.287, "dur": 153.885, "args": { "External id": 19448,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651038509.708, "dur": 134.152, "args": { "External id": 19449,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651038531.755, "dur": 11.901, "args": { "External id": 19450,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651038546.976, "dur": 68.152, "args": { "External id": 19451,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651038549.417, "dur": 65.351, "args": { "External id": 19452,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038553.746, "dur": 7.874, "args": { "External id": 19453,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651038563.475, "dur": 50.774, "args": { "External id": 19454,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2045 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.23", "pid": 1336757, "tid": 1381170, "ts": 1295651038752.309, "dur": 617.882, "args": { "External id": 19455,"Record function id": 0, "Ev Idx": 2046 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.23)", "pid": 1336757, "tid": 1381170, "ts": 1295651038769.046, "dur": 587.550, "args": { "External id": 19456,"Record function id": 0, "Ev Idx": 2047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651038845.699, "dur": 4.528, "args": { "External id": 19457,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651038865.551, "dur": 29.575, "args": { "External id": 19458,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038870.528, "dur": 1.749, "args": { "External id": 19459,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038874.388, "dur": 0.327, "args": { "External id": 19460,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038876.573, "dur": 0.406, "args": { "External id": 19461,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038878.750, "dur": 0.410, "args": { "External id": 19462,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038880.996, "dur": 0.403, "args": { "External id": 19463,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038883.142, "dur": 0.490, "args": { "External id": 19464,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038885.246, "dur": 1.182, "args": { "External id": 19465,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038888.125, "dur": 0.357, "args": { "External id": 19466,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651038890.208, "dur": 0.477, "args": { "External id": 19467,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651038904.949, "dur": 30.061, "args": { "External id": 19468,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2059 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651038965.376, "dur": 149.390, "args": { "External id": 19469,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651038975.685, "dur": 2.970, "args": { "External id": 19470,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651039022.069, "dur": 12.439, "args": { "External id": 19471,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651039026.941, "dur": 7.134, "args": { "External id": 19472,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039031.460, "dur": 0.793, "args": { "External id": 19473,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651039043.432, "dur": 25.996, "args": { "External id": 19474,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039046.574, "dur": 0.427, "args": { "External id": 19475,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039048.725, "dur": 0.604, "args": { "External id": 19476,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039051.140, "dur": 0.440, "args": { "External id": 19477,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039053.024, "dur": 1.480, "args": { "External id": 19478,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039056.163, "dur": 0.330, "args": { "External id": 19479,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039058.293, "dur": 0.320, "args": { "External id": 19480,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039060.151, "dur": 0.338, "args": { "External id": 19481,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039062.016, "dur": 0.320, "args": { "External id": 19482,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651039063.995, "dur": 0.385, "args": { "External id": 19483,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651039083.449, "dur": 22.993, "args": { "External id": 19484,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2075 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651039163.959, "dur": 124.333, "args": { "External id": 19485,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2076 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651039185.565, "dur": 98.971, "args": { "External id": 19486,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2077, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651039195.245, "dur": 84.052, "args": { "External id": 19487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2078 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651039303.755, "dur": 1.778, "args": { "External id": 19488,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2079, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651039385.551, "dur": 1671.269, "args": { "External id": 19489,"Sequence number": 246590, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2080 } }, { "ph": "f", "id": 178, "pid": 1336757, "tid": 1381170, "ts": 1295651039385.551, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651039496.559, "dur": 100.943, "args": { "External id": 19490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2081 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651039636.470, "dur": 38.908, "args": { "External id": 19491,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651039691.966, "dur": 48.573, "args": { "External id": 19492,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651039750.084, "dur": 34.047, "args": { "External id": 19493,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651039792.700, "dur": 46.352, "args": { "External id": 19494,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651039846.566, "dur": 29.142, "args": { "External id": 19495,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651039882.693, "dur": 42.890, "args": { "External id": 19496,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2087 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651039946.524, "dur": 23.045, "args": { "External id": 19497,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2088 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651040042.717, "dur": 31.159, "args": { "External id": 19498,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2089 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651040096.307, "dur": 21.949, "args": { "External id": 19499,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2090 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651040131.982, "dur": 16.513, "args": { "External id": 19500,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040157.731, "dur": 36.305, "args": { "External id": 19501,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040197.562, "dur": 51.794, "args": { "External id": 19502,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2093 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651040293.932, "dur": 176.668, "args": { "External id": 19503,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651040376.219, "dur": 5.480, "args": { "External id": 19504,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651040384.186, "dur": 2.070, "args": { "External id": 19505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2096 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651040502.334, "dur": 25.276, "args": { "External id": 19506,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2097 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651040538.567, "dur": 15.651, "args": { "External id": 19507,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040562.661, "dur": 40.232, "args": { "External id": 19508,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040609.735, "dur": 36.488, "args": { "External id": 19509,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040656.078, "dur": 22.604, "args": { "External id": 19510,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040684.128, "dur": 30.175, "args": { "External id": 19511,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040720.539, "dur": 22.065, "args": { "External id": 19512,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651040749.778, "dur": 45.507, "args": { "External id": 19513,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2104 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651040817.247, "dur": 25.409, "args": { "External id": 19514,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2105 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651040859.162, "dur": 26.664, "args": { "External id": 19515,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2106 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651040900.475, "dur": 17.113, "args": { "External id": 19516,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2107 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651040931.295, "dur": 20.086, "args": { "External id": 19517,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2108 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651040964.936, "dur": 16.245, "args": { "External id": 19518,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2109 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041100.580, "dur": 15.443, "args": { "External id": 19519,"Record function id": 0, "Ev Idx": 2110 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041104.104, "dur": 11.132, "args": { "External id": 19520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041108.300, "dur": 5.989, "args": { "External id": 19521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2112 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041110.069, "dur": 4.100, "args": { "External id": 19522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2113 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041119.963, "dur": 5.361, "args": { "External id": 19523,"Record function id": 0, "Ev Idx": 2114 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041121.490, "dur": 3.386, "args": { "External id": 19524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041122.510, "dur": 1.920, "args": { "External id": 19525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2116 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041123.366, "dur": 0.955, "args": { "External id": 19526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2117 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041128.609, "dur": 4.635, "args": { "External id": 19527,"Record function id": 0, "Ev Idx": 2118 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041129.864, "dur": 2.972, "args": { "External id": 19528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041130.843, "dur": 1.546, "args": { "External id": 19529,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2120 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041131.353, "dur": 0.965, "args": { "External id": 19530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041136.449, "dur": 4.723, "args": { "External id": 19531,"Record function id": 0, "Ev Idx": 2122 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041137.695, "dur": 3.052, "args": { "External id": 19532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041138.221, "dur": 2.099, "args": { "External id": 19533,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2124 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041138.655, "dur": 1.595, "args": { "External id": 19534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2125 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041144.295, "dur": 3.841, "args": { "External id": 19535,"Record function id": 0, "Ev Idx": 2126 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041145.535, "dur": 2.180, "args": { "External id": 19536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041146.171, "dur": 1.072, "args": { "External id": 19537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2128 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041146.487, "dur": 0.697, "args": { "External id": 19538,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2129 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041151.242, "dur": 3.966, "args": { "External id": 19539,"Record function id": 0, "Ev Idx": 2130 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041152.288, "dur": 2.473, "args": { "External id": 19540,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041152.895, "dur": 1.320, "args": { "External id": 19541,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2132 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041153.476, "dur": 0.631, "args": { "External id": 19542,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2133 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041158.426, "dur": 3.822, "args": { "External id": 19543,"Record function id": 0, "Ev Idx": 2134 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041159.647, "dur": 2.207, "args": { "External id": 19544,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041160.291, "dur": 1.131, "args": { "External id": 19545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2136 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041160.761, "dur": 0.554, "args": { "External id": 19546,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2137 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041165.333, "dur": 3.343, "args": { "External id": 19547,"Record function id": 0, "Ev Idx": 2138 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041166.345, "dur": 1.916, "args": { "External id": 19548,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041166.810, "dur": 1.019, "args": { "External id": 19549,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2140 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041167.195, "dur": 0.563, "args": { "External id": 19550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2141 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041171.820, "dur": 3.842, "args": { "External id": 19551,"Record function id": 0, "Ev Idx": 2142 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651041172.924, "dur": 2.330, "args": { "External id": 19552,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041173.599, "dur": 1.195, "args": { "External id": 19553,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2144 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651041174.158, "dur": 0.545, "args": { "External id": 19554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2145 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651041179.187, "dur": 39045.808, "args": { "External id": 19555,"Record function id": 0, "Sequence number": 246589, "Fwd thread id": 1, "Ev Idx": 2146 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651041180.484, "dur": 39036.588, "args": { "External id": 19556,"Sequence number": 246589, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2147 } }, { "ph": "f", "id": 179, "pid": 1336757, "tid": 1381170, "ts": 1295651041180.484, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.24)", "pid": 1336757, "tid": 1381170, "ts": 1295651041208.108, "dur": 51.664, "args": { "External id": 19557,"Record function id": 0, "Ev Idx": 2148 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.24)", "pid": 1336757, "tid": 1381170, "ts": 1295651041269.126, "dur": 59.549, "args": { "External id": 19558,"Record function id": 0, "Ev Idx": 2149 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.24)", "pid": 1336757, "tid": 1381170, "ts": 1295651041334.785, "dur": 38874.812, "args": { "External id": 19559,"Record function id": 0, "Ev Idx": 2150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651041423.038, "dur": 7.077, "args": { "External id": 19560,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651041439.623, "dur": 4.917, "args": { "External id": 19561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2152 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651041459.444, "dur": 37964.946, "args": { "External id": 19562,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651041472.647, "dur": 37942.365, "args": { "External id": 19563,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651041532.804, "dur": 14.486, "args": { "External id": 19564,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651041554.268, "dur": 37820.345, "args": { "External id": 19565,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651041556.779, "dur": 37816.998, "args": { "External id": 19566,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651041561.069, "dur": 4.618, "args": { "External id": 19567,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651041567.758, "dur": 37802.527, "args": { "External id": 19568,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651079514.266, "dur": 9.120, "args": { "External id": 19569,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651079517.904, "dur": 5.162, "args": { "External id": 19570,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2161 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651079552.927, "dur": 308.596, "args": { "External id": 19571,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2162 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651079581.136, "dur": 275.723, "args": { "External id": 19572,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2163, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651079592.754, "dur": 259.042, "args": { "External id": 19573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2164 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651079879.306, "dur": 2.152, "args": { "External id": 19574,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2165, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651079935.614, "dur": 6.350, "args": { "External id": 19575,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080036.552, "dur": 2.493, "args": { "External id": 19576,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080060.200, "dur": 1.249, "args": { "External id": 19577,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080075.940, "dur": 1.165, "args": { "External id": 19578,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080090.793, "dur": 0.828, "args": { "External id": 19579,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080104.081, "dur": 1.019, "args": { "External id": 19580,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080117.184, "dur": 1.463, "args": { "External id": 19581,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080131.864, "dur": 2.775, "args": { "External id": 19582,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080146.498, "dur": 1.043, "args": { "External id": 19583,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2174 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651080256.057, "dur": 2664.514, "args": { "External id": 19584,"Record function id": 0, "Ev Idx": 2175 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.23)", "pid": 1336757, "tid": 1381170, "ts": 1295651080276.531, "dur": 1002.826, "args": { "External id": 19585,"Record function id": 0, "Ev Idx": 2176 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.23)", "pid": 1336757, "tid": 1381170, "ts": 1295651080290.928, "dur": 321.044, "args": { "External id": 19586,"Record function id": 0, "Ev Idx": 2177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080371.095, "dur": 4.746, "args": { "External id": 19587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080378.955, "dur": 1.119, "args": { "External id": 19588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080381.998, "dur": 1.066, "args": { "External id": 19589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080384.758, "dur": 2.252, "args": { "External id": 19590,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080388.669, "dur": 1.230, "args": { "External id": 19591,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080391.589, "dur": 1.102, "args": { "External id": 19592,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080394.537, "dur": 2.221, "args": { "External id": 19593,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080398.162, "dur": 1.015, "args": { "External id": 19594,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080400.573, "dur": 0.891, "args": { "External id": 19595,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651080402.950, "dur": 0.965, "args": { "External id": 19596,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2187 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651080422.169, "dur": 154.634, "args": { "External id": 19597,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651080438.401, "dur": 133.860, "args": { "External id": 19598,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651080459.785, "dur": 12.012, "args": { "External id": 19599,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651080474.757, "dur": 68.546, "args": { "External id": 19600,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651080477.454, "dur": 65.523, "args": { "External id": 19601,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080481.524, "dur": 6.771, "args": { "External id": 19602,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651080490.566, "dur": 51.868, "args": { "External id": 19603,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2194 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.22", "pid": 1336757, "tid": 1381170, "ts": 1295651080689.235, "dur": 582.189, "args": { "External id": 19604,"Record function id": 0, "Ev Idx": 2195 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.22)", "pid": 1336757, "tid": 1381170, "ts": 1295651080707.205, "dur": 550.382, "args": { "External id": 19605,"Record function id": 0, "Ev Idx": 2196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651080759.458, "dur": 4.725, "args": { "External id": 19606,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651080779.033, "dur": 30.422, "args": { "External id": 19607,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080784.027, "dur": 1.403, "args": { "External id": 19608,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080787.955, "dur": 0.351, "args": { "External id": 19609,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080790.135, "dur": 0.622, "args": { "External id": 19610,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080792.911, "dur": 0.340, "args": { "External id": 19611,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080794.968, "dur": 0.577, "args": { "External id": 19612,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080797.263, "dur": 0.413, "args": { "External id": 19613,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080799.705, "dur": 1.390, "args": { "External id": 19614,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080802.942, "dur": 0.418, "args": { "External id": 19615,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080804.994, "dur": 0.413, "args": { "External id": 19616,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651080818.762, "dur": 28.843, "args": { "External id": 19617,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2208 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651080876.928, "dur": 99.536, "args": { "External id": 19618,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651080886.592, "dur": 3.110, "args": { "External id": 19619,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651080894.765, "dur": 11.300, "args": { "External id": 19620,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651080899.452, "dur": 6.190, "args": { "External id": 19621,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080903.688, "dur": 0.646, "args": { "External id": 19622,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651080913.021, "dur": 27.037, "args": { "External id": 19623,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080915.517, "dur": 0.423, "args": { "External id": 19624,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080918.475, "dur": 0.512, "args": { "External id": 19625,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080920.821, "dur": 0.417, "args": { "External id": 19626,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080923.447, "dur": 1.386, "args": { "External id": 19627,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080926.374, "dur": 0.450, "args": { "External id": 19628,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080928.592, "dur": 0.375, "args": { "External id": 19629,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080930.744, "dur": 0.556, "args": { "External id": 19630,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080933.017, "dur": 0.415, "args": { "External id": 19631,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651080934.928, "dur": 0.333, "args": { "External id": 19632,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651080949.416, "dur": 19.124, "args": { "External id": 19633,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2224 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651081062.793, "dur": 111.253, "args": { "External id": 19634,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2225 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651081085.573, "dur": 85.022, "args": { "External id": 19635,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2226, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651081095.649, "dur": 70.732, "args": { "External id": 19636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2227 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651081187.815, "dur": 1.711, "args": { "External id": 19637,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2228, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651081286.908, "dur": 1613.560, "args": { "External id": 19638,"Sequence number": 246588, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2229 } }, { "ph": "f", "id": 180, "pid": 1336757, "tid": 1381170, "ts": 1295651081286.908, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651081397.024, "dur": 102.850, "args": { "External id": 19639,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2230 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651081538.776, "dur": 39.101, "args": { "External id": 19640,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651081594.907, "dur": 49.066, "args": { "External id": 19641,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651081654.147, "dur": 34.964, "args": { "External id": 19642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651081697.494, "dur": 45.418, "args": { "External id": 19643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651081750.214, "dur": 29.290, "args": { "External id": 19644,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651081788.026, "dur": 43.518, "args": { "External id": 19645,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2236 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651081852.866, "dur": 22.744, "args": { "External id": 19646,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2237 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651081893.606, "dur": 27.435, "args": { "External id": 19647,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2238 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651081938.841, "dur": 21.354, "args": { "External id": 19648,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2239 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651081974.889, "dur": 55.438, "args": { "External id": 19649,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082042.671, "dur": 35.629, "args": { "External id": 19650,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082082.022, "dur": 34.947, "args": { "External id": 19651,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2242 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651082144.842, "dur": 193.848, "args": { "External id": 19652,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651082225.957, "dur": 20.449, "args": { "External id": 19653,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651082249.863, "dur": 2.433, "args": { "External id": 19654,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2245 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651082372.048, "dur": 26.019, "args": { "External id": 19655,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2246 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651082409.468, "dur": 15.292, "args": { "External id": 19656,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082433.599, "dur": 38.394, "args": { "External id": 19657,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082479.003, "dur": 34.948, "args": { "External id": 19658,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082540.723, "dur": 25.225, "args": { "External id": 19659,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082572.314, "dur": 31.236, "args": { "External id": 19660,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082610.723, "dur": 22.379, "args": { "External id": 19661,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651082640.851, "dur": 31.154, "args": { "External id": 19662,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2253 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651082701.020, "dur": 28.851, "args": { "External id": 19663,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2254 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651082747.911, "dur": 24.932, "args": { "External id": 19664,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2255 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651082786.785, "dur": 21.254, "args": { "External id": 19665,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2256 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651082824.461, "dur": 15.910, "args": { "External id": 19666,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2257 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651082854.205, "dur": 18.612, "args": { "External id": 19667,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2258 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082942.320, "dur": 15.440, "args": { "External id": 19668,"Record function id": 0, "Ev Idx": 2259 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082945.719, "dur": 11.113, "args": { "External id": 19669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651082949.924, "dur": 6.041, "args": { "External id": 19670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2261 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651082951.672, "dur": 4.120, "args": { "External id": 19671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2262 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082961.772, "dur": 4.886, "args": { "External id": 19672,"Record function id": 0, "Ev Idx": 2263 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082963.085, "dur": 3.186, "args": { "External id": 19673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651082963.901, "dur": 1.853, "args": { "External id": 19674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2265 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651082964.521, "dur": 1.077, "args": { "External id": 19675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082969.932, "dur": 5.376, "args": { "External id": 19676,"Record function id": 0, "Ev Idx": 2267 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082971.372, "dur": 3.519, "args": { "External id": 19677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651082972.230, "dur": 2.234, "args": { "External id": 19678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2269 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651082972.975, "dur": 1.390, "args": { "External id": 19679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2270 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082978.531, "dur": 55.634, "args": { "External id": 19680,"Record function id": 0, "Ev Idx": 2271 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651082979.762, "dur": 53.257, "args": { "External id": 19681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083027.528, "dur": 4.387, "args": { "External id": 19682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2273 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083029.167, "dur": 2.496, "args": { "External id": 19683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2274 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083039.731, "dur": 5.042, "args": { "External id": 19684,"Record function id": 0, "Ev Idx": 2275 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083041.360, "dur": 3.006, "args": { "External id": 19685,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083042.431, "dur": 1.481, "args": { "External id": 19686,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2277 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083043.031, "dur": 0.822, "args": { "External id": 19687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2278 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083047.924, "dur": 4.014, "args": { "External id": 19688,"Record function id": 0, "Ev Idx": 2279 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083049.097, "dur": 2.437, "args": { "External id": 19689,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083049.782, "dur": 1.342, "args": { "External id": 19690,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2281 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083050.449, "dur": 0.576, "args": { "External id": 19691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2282 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083055.487, "dur": 3.809, "args": { "External id": 19692,"Record function id": 0, "Ev Idx": 2283 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083056.861, "dur": 2.015, "args": { "External id": 19693,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083057.550, "dur": 0.903, "args": { "External id": 19694,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2285 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083057.852, "dur": 0.508, "args": { "External id": 19695,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2286 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083062.482, "dur": 3.987, "args": { "External id": 19696,"Record function id": 0, "Ev Idx": 2287 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083063.717, "dur": 2.321, "args": { "External id": 19697,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083064.544, "dur": 1.049, "args": { "External id": 19698,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2289 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083064.846, "dur": 0.687, "args": { "External id": 19699,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2290 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083069.528, "dur": 3.807, "args": { "External id": 19700,"Record function id": 0, "Ev Idx": 2291 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651083070.838, "dur": 2.080, "args": { "External id": 19701,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083071.295, "dur": 1.200, "args": { "External id": 19702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2293 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651083071.767, "dur": 0.633, "args": { "External id": 19703,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2294 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651083076.999, "dur": 37804.911, "args": { "External id": 19704,"Record function id": 0, "Sequence number": 246587, "Fwd thread id": 1, "Ev Idx": 2295 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651083078.546, "dur": 37795.643, "args": { "External id": 19705,"Sequence number": 246587, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2296 } }, { "ph": "f", "id": 181, "pid": 1336757, "tid": 1381170, "ts": 1295651083078.546, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.23)", "pid": 1336757, "tid": 1381170, "ts": 1295651083108.981, "dur": 36.052, "args": { "External id": 19706,"Record function id": 0, "Ev Idx": 2297 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.23)", "pid": 1336757, "tid": 1381170, "ts": 1295651083152.972, "dur": 57.659, "args": { "External id": 19707,"Record function id": 0, "Ev Idx": 2298 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.23)", "pid": 1336757, "tid": 1381170, "ts": 1295651083216.213, "dur": 37651.261, "args": { "External id": 19708,"Record function id": 0, "Ev Idx": 2299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651083318.403, "dur": 7.608, "args": { "External id": 19709,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651083335.998, "dur": 5.028, "args": { "External id": 19710,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2301 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651083356.513, "dur": 36752.592, "args": { "External id": 19711,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651083369.393, "dur": 36731.237, "args": { "External id": 19712,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651083423.219, "dur": 14.393, "args": { "External id": 19713,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651083444.151, "dur": 36616.819, "args": { "External id": 19714,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651083446.541, "dur": 36613.698, "args": { "External id": 19715,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651083450.496, "dur": 4.203, "args": { "External id": 19716,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651083456.437, "dur": 36600.245, "args": { "External id": 19717,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651120195.106, "dur": 9.532, "args": { "External id": 19718,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651120198.761, "dur": 5.494, "args": { "External id": 19719,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2310 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651120245.982, "dur": 336.235, "args": { "External id": 19720,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2311 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651120273.668, "dur": 303.854, "args": { "External id": 19721,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2312, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651120285.396, "dur": 286.687, "args": { "External id": 19722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2313 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651120600.119, "dur": 2.115, "args": { "External id": 19723,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2314, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120659.749, "dur": 6.532, "args": { "External id": 19724,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120711.706, "dur": 1.609, "args": { "External id": 19725,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120730.266, "dur": 1.115, "args": { "External id": 19726,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120744.810, "dur": 0.901, "args": { "External id": 19727,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120757.763, "dur": 0.715, "args": { "External id": 19728,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120769.675, "dur": 1.189, "args": { "External id": 19729,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120782.112, "dur": 0.847, "args": { "External id": 19730,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120794.141, "dur": 2.478, "args": { "External id": 19731,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651120807.459, "dur": 0.870, "args": { "External id": 19732,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2323 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651120896.113, "dur": 2750.132, "args": { "External id": 19733,"Record function id": 0, "Ev Idx": 2324 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.22)", "pid": 1336757, "tid": 1381170, "ts": 1295651120914.530, "dur": 1014.229, "args": { "External id": 19734,"Record function id": 0, "Ev Idx": 2325 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.22)", "pid": 1336757, "tid": 1381170, "ts": 1295651120929.362, "dur": 375.051, "args": { "External id": 19735,"Record function id": 0, "Ev Idx": 2326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121040.526, "dur": 4.995, "args": { "External id": 19736,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121049.390, "dur": 1.329, "args": { "External id": 19737,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121052.545, "dur": 0.961, "args": { "External id": 19738,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121055.212, "dur": 2.077, "args": { "External id": 19739,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121058.904, "dur": 1.158, "args": { "External id": 19740,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121061.782, "dur": 0.948, "args": { "External id": 19741,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121064.418, "dur": 2.323, "args": { "External id": 19742,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121068.257, "dur": 0.998, "args": { "External id": 19743,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121070.979, "dur": 1.039, "args": { "External id": 19744,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651121073.664, "dur": 1.167, "args": { "External id": 19745,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2336 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651121093.270, "dur": 171.874, "args": { "External id": 19746,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651121108.919, "dur": 150.811, "args": { "External id": 19747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651121132.013, "dur": 11.804, "args": { "External id": 19748,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651121146.953, "dur": 67.694, "args": { "External id": 19749,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651121149.941, "dur": 64.380, "args": { "External id": 19750,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121154.094, "dur": 7.916, "args": { "External id": 19751,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651121163.993, "dur": 49.846, "args": { "External id": 19752,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2343 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.21", "pid": 1336757, "tid": 1381170, "ts": 1295651121388.960, "dur": 531.861, "args": { "External id": 19753,"Record function id": 0, "Ev Idx": 2344 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.21)", "pid": 1336757, "tid": 1381170, "ts": 1295651121406.940, "dur": 500.509, "args": { "External id": 19754,"Record function id": 0, "Ev Idx": 2345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651121464.910, "dur": 5.307, "args": { "External id": 19755,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651121486.021, "dur": 30.595, "args": { "External id": 19756,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121490.887, "dur": 1.965, "args": { "External id": 19757,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121494.990, "dur": 0.478, "args": { "External id": 19758,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121497.355, "dur": 0.446, "args": { "External id": 19759,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121499.843, "dur": 0.449, "args": { "External id": 19760,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121502.155, "dur": 0.341, "args": { "External id": 19761,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121504.179, "dur": 0.460, "args": { "External id": 19762,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121506.420, "dur": 1.467, "args": { "External id": 19763,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121509.729, "dur": 0.358, "args": { "External id": 19764,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121511.849, "dur": 0.298, "args": { "External id": 19765,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651121530.906, "dur": 30.370, "args": { "External id": 19766,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2357 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651121592.144, "dur": 100.652, "args": { "External id": 19767,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651121602.709, "dur": 2.946, "args": { "External id": 19768,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651121610.608, "dur": 10.299, "args": { "External id": 19769,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651121614.923, "dur": 5.560, "args": { "External id": 19770,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121618.608, "dur": 0.590, "args": { "External id": 19771,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651121627.725, "dur": 26.327, "args": { "External id": 19772,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121630.276, "dur": 0.602, "args": { "External id": 19773,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121632.311, "dur": 0.525, "args": { "External id": 19774,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121634.398, "dur": 0.435, "args": { "External id": 19775,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121636.385, "dur": 1.417, "args": { "External id": 19776,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121639.876, "dur": 0.364, "args": { "External id": 19777,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121641.651, "dur": 0.593, "args": { "External id": 19778,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121644.212, "dur": 0.764, "args": { "External id": 19779,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121646.558, "dur": 0.362, "args": { "External id": 19780,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651121648.799, "dur": 0.325, "args": { "External id": 19781,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651121665.953, "dur": 18.942, "args": { "External id": 19782,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2373 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651121736.984, "dur": 106.517, "args": { "External id": 19783,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2374 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651121758.955, "dur": 81.079, "args": { "External id": 19784,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2375, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651121768.766, "dur": 67.408, "args": { "External id": 19785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2376 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651121858.477, "dur": 1.810, "args": { "External id": 19786,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2377, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651121936.793, "dur": 1685.510, "args": { "External id": 19787,"Sequence number": 246586, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2378 } }, { "ph": "f", "id": 182, "pid": 1336757, "tid": 1381170, "ts": 1295651121936.793, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651122084.488, "dur": 104.512, "args": { "External id": 19788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2379 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651122227.260, "dur": 55.017, "args": { "External id": 19789,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651122302.744, "dur": 56.381, "args": { "External id": 19790,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651122369.396, "dur": 35.274, "args": { "External id": 19791,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651122411.956, "dur": 45.529, "args": { "External id": 19792,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651122465.539, "dur": 29.538, "args": { "External id": 19793,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651122502.411, "dur": 43.211, "args": { "External id": 19794,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2385 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651122568.974, "dur": 22.711, "args": { "External id": 19795,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2386 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651122618.664, "dur": 28.275, "args": { "External id": 19796,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2387 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651122666.777, "dur": 21.143, "args": { "External id": 19797,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2388 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651122701.408, "dur": 15.766, "args": { "External id": 19798,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651122726.192, "dur": 31.120, "args": { "External id": 19799,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651122760.425, "dur": 33.093, "args": { "External id": 19800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2391 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651122820.575, "dur": 218.994, "args": { "External id": 19801,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651122899.423, "dur": 5.703, "args": { "External id": 19802,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651122907.336, "dur": 2.068, "args": { "External id": 19803,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2394 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651123075.229, "dur": 30.601, "args": { "External id": 19804,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2395 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651123116.824, "dur": 15.878, "args": { "External id": 19805,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651123142.824, "dur": 42.504, "args": { "External id": 19806,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651123192.363, "dur": 50.712, "args": { "External id": 19807,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651123255.055, "dur": 27.147, "args": { "External id": 19808,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651123288.397, "dur": 31.424, "args": { "External id": 19809,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651123326.909, "dur": 22.531, "args": { "External id": 19810,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651123356.808, "dur": 30.825, "args": { "External id": 19811,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2402 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651123415.870, "dur": 30.888, "args": { "External id": 19812,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2403 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651123466.771, "dur": 23.942, "args": { "External id": 19813,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2404 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651123504.434, "dur": 17.939, "args": { "External id": 19814,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2405 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651123540.257, "dur": 15.603, "args": { "External id": 19815,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2406 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651123574.170, "dur": 19.147, "args": { "External id": 19816,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2407 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123668.251, "dur": 15.640, "args": { "External id": 19817,"Record function id": 0, "Ev Idx": 2408 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123671.585, "dur": 11.334, "args": { "External id": 19818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123675.638, "dur": 6.332, "args": { "External id": 19819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2410 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123677.554, "dur": 4.296, "args": { "External id": 19820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2411 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123687.890, "dur": 6.044, "args": { "External id": 19821,"Record function id": 0, "Ev Idx": 2412 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123689.425, "dur": 4.058, "args": { "External id": 19822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123690.524, "dur": 2.458, "args": { "External id": 19823,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2414 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123691.176, "dur": 1.697, "args": { "External id": 19824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2415 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123697.117, "dur": 7.994, "args": { "External id": 19825,"Record function id": 0, "Ev Idx": 2416 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123698.441, "dur": 6.227, "args": { "External id": 19826,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123699.056, "dur": 5.173, "args": { "External id": 19827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2418 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123699.903, "dur": 4.263, "args": { "External id": 19828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2419 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123708.310, "dur": 4.021, "args": { "External id": 19829,"Record function id": 0, "Ev Idx": 2420 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123709.449, "dur": 2.435, "args": { "External id": 19830,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123710.058, "dur": 1.431, "args": { "External id": 19831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2422 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123710.425, "dur": 1.002, "args": { "External id": 19832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2423 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123715.437, "dur": 3.394, "args": { "External id": 19833,"Record function id": 0, "Ev Idx": 2424 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123716.362, "dur": 2.043, "args": { "External id": 19834,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123716.809, "dur": 1.216, "args": { "External id": 19835,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2426 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123717.238, "dur": 0.718, "args": { "External id": 19836,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2427 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123722.157, "dur": 3.385, "args": { "External id": 19837,"Record function id": 0, "Ev Idx": 2428 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123723.134, "dur": 1.976, "args": { "External id": 19838,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123723.651, "dur": 1.051, "args": { "External id": 19839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2430 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123724.062, "dur": 0.527, "args": { "External id": 19840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2431 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123728.807, "dur": 3.306, "args": { "External id": 19841,"Record function id": 0, "Ev Idx": 2432 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123729.852, "dur": 1.833, "args": { "External id": 19842,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123730.306, "dur": 0.974, "args": { "External id": 19843,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2434 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123730.605, "dur": 0.583, "args": { "External id": 19844,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2435 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123735.270, "dur": 3.350, "args": { "External id": 19845,"Record function id": 0, "Ev Idx": 2436 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123736.417, "dur": 1.750, "args": { "External id": 19846,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123736.939, "dur": 0.834, "args": { "External id": 19847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2438 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123737.206, "dur": 0.497, "args": { "External id": 19848,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2439 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123741.699, "dur": 4.001, "args": { "External id": 19849,"Record function id": 0, "Ev Idx": 2440 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651123742.680, "dur": 2.593, "args": { "External id": 19850,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123743.314, "dur": 1.584, "args": { "External id": 19851,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2442 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651123743.828, "dur": 0.981, "args": { "External id": 19852,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2443 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651123749.489, "dur": 36692.958, "args": { "External id": 19853,"Record function id": 0, "Sequence number": 246585, "Fwd thread id": 1, "Ev Idx": 2444 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651123750.961, "dur": 36682.720, "args": { "External id": 19854,"Sequence number": 246585, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2445 } }, { "ph": "f", "id": 183, "pid": 1336757, "tid": 1381170, "ts": 1295651123750.961, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.22)", "pid": 1336757, "tid": 1381170, "ts": 1295651123779.358, "dur": 36.488, "args": { "External id": 19855,"Record function id": 0, "Ev Idx": 2446 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.22)", "pid": 1336757, "tid": 1381170, "ts": 1295651123823.409, "dur": 59.886, "args": { "External id": 19856,"Record function id": 0, "Ev Idx": 2447 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.22)", "pid": 1336757, "tid": 1381170, "ts": 1295651123888.956, "dur": 36536.449, "args": { "External id": 19857,"Record function id": 0, "Ev Idx": 2448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651123973.336, "dur": 6.424, "args": { "External id": 19858,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651124039.156, "dur": 5.323, "args": { "External id": 19859,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2450 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651124060.427, "dur": 35570.285, "args": { "External id": 19860,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651124074.039, "dur": 35548.108, "args": { "External id": 19861,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651124127.712, "dur": 14.310, "args": { "External id": 19862,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651124148.347, "dur": 35434.789, "args": { "External id": 19863,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651124151.013, "dur": 35431.544, "args": { "External id": 19864,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651124154.734, "dur": 6.788, "args": { "External id": 19865,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651124163.654, "dur": 35415.425, "args": { "External id": 19866,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651159716.768, "dur": 9.793, "args": { "External id": 19867,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651159720.377, "dur": 5.803, "args": { "External id": 19868,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2459 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651159754.564, "dur": 366.510, "args": { "External id": 19869,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2460 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651159780.073, "dur": 335.864, "args": { "External id": 19870,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2461, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651159791.081, "dur": 319.167, "args": { "External id": 19871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2462 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651160141.130, "dur": 2.700, "args": { "External id": 19872,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2463, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160200.489, "dur": 6.531, "args": { "External id": 19873,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160267.669, "dur": 2.414, "args": { "External id": 19874,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160288.420, "dur": 0.928, "args": { "External id": 19875,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160301.388, "dur": 1.356, "args": { "External id": 19876,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160315.130, "dur": 1.149, "args": { "External id": 19877,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160327.090, "dur": 1.226, "args": { "External id": 19878,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160340.150, "dur": 1.074, "args": { "External id": 19879,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160352.402, "dur": 2.783, "args": { "External id": 19880,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160365.216, "dur": 1.187, "args": { "External id": 19881,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2472 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651160457.047, "dur": 2707.688, "args": { "External id": 19882,"Record function id": 0, "Ev Idx": 2473 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.21)", "pid": 1336757, "tid": 1381170, "ts": 1295651160475.145, "dur": 1020.524, "args": { "External id": 19883,"Record function id": 0, "Ev Idx": 2474 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.21)", "pid": 1336757, "tid": 1381170, "ts": 1295651160489.569, "dur": 315.856, "args": { "External id": 19884,"Record function id": 0, "Ev Idx": 2475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160562.668, "dur": 4.154, "args": { "External id": 19885,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160570.326, "dur": 1.095, "args": { "External id": 19886,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160573.488, "dur": 1.012, "args": { "External id": 19887,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160576.083, "dur": 1.552, "args": { "External id": 19888,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160579.348, "dur": 1.252, "args": { "External id": 19889,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160582.119, "dur": 1.176, "args": { "External id": 19890,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160587.058, "dur": 2.235, "args": { "External id": 19891,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160591.022, "dur": 0.914, "args": { "External id": 19892,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160593.202, "dur": 1.473, "args": { "External id": 19893,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651160596.101, "dur": 0.834, "args": { "External id": 19894,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2485 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651160616.117, "dur": 156.984, "args": { "External id": 19895,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651160640.557, "dur": 127.949, "args": { "External id": 19896,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651160656.906, "dur": 12.245, "args": { "External id": 19897,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651160672.066, "dur": 67.152, "args": { "External id": 19898,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651160674.679, "dur": 64.144, "args": { "External id": 19899,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160678.933, "dur": 6.864, "args": { "External id": 19900,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651160687.863, "dur": 50.434, "args": { "External id": 19901,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2492 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.20", "pid": 1336757, "tid": 1381170, "ts": 1295651160882.460, "dur": 606.207, "args": { "External id": 19902,"Record function id": 0, "Ev Idx": 2493 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.20)", "pid": 1336757, "tid": 1381170, "ts": 1295651160898.352, "dur": 577.716, "args": { "External id": 19903,"Record function id": 0, "Ev Idx": 2494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651160951.608, "dur": 4.771, "args": { "External id": 19904,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651160971.668, "dur": 83.144, "args": { "External id": 19905,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160976.759, "dur": 1.328, "args": { "External id": 19906,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651160980.339, "dur": 50.341, "args": { "External id": 19907,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161034.166, "dur": 0.921, "args": { "External id": 19908,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161036.842, "dur": 0.950, "args": { "External id": 19909,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161039.432, "dur": 0.682, "args": { "External id": 19910,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161041.721, "dur": 0.658, "args": { "External id": 19911,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161044.216, "dur": 0.517, "args": { "External id": 19912,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161046.689, "dur": 0.538, "args": { "External id": 19913,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161048.899, "dur": 0.574, "args": { "External id": 19914,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651161064.545, "dur": 31.648, "args": { "External id": 19915,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2506 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651161131.047, "dur": 115.410, "args": { "External id": 19916,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651161141.887, "dur": 4.294, "args": { "External id": 19917,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651161151.304, "dur": 10.627, "args": { "External id": 19918,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651161155.351, "dur": 6.185, "args": { "External id": 19919,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161158.975, "dur": 1.114, "args": { "External id": 19920,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651161169.166, "dur": 26.729, "args": { "External id": 19921,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161171.233, "dur": 0.575, "args": { "External id": 19922,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161173.809, "dur": 0.717, "args": { "External id": 19923,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161176.357, "dur": 0.681, "args": { "External id": 19924,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161178.831, "dur": 0.676, "args": { "External id": 19925,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161181.264, "dur": 0.562, "args": { "External id": 19926,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161183.628, "dur": 0.634, "args": { "External id": 19927,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161185.759, "dur": 0.633, "args": { "External id": 19928,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161188.429, "dur": 0.681, "args": { "External id": 19929,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651161190.894, "dur": 0.624, "args": { "External id": 19930,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651161206.066, "dur": 18.116, "args": { "External id": 19931,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2522 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651161295.063, "dur": 113.669, "args": { "External id": 19932,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2523 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651161320.863, "dur": 84.499, "args": { "External id": 19933,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2524, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651161330.552, "dur": 70.840, "args": { "External id": 19934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2525 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651161423.809, "dur": 1.916, "args": { "External id": 19935,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2526, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651161502.753, "dur": 1640.193, "args": { "External id": 19936,"Sequence number": 246584, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2527 } }, { "ph": "f", "id": 184, "pid": 1336757, "tid": 1381170, "ts": 1295651161502.753, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651161608.001, "dur": 100.064, "args": { "External id": 19937,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2528 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651161748.239, "dur": 38.947, "args": { "External id": 19938,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651161803.462, "dur": 47.795, "args": { "External id": 19939,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651161860.804, "dur": 33.684, "args": { "External id": 19940,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651161901.608, "dur": 44.355, "args": { "External id": 19941,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651161952.954, "dur": 67.328, "args": { "External id": 19942,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162032.070, "dur": 47.972, "args": { "External id": 19943,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2534 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651162107.862, "dur": 24.187, "args": { "External id": 19944,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2535 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651162151.714, "dur": 28.534, "args": { "External id": 19945,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2536 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651162201.238, "dur": 21.608, "args": { "External id": 19946,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2537 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651162254.753, "dur": 18.885, "args": { "External id": 19947,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162284.830, "dur": 35.218, "args": { "External id": 19948,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162323.762, "dur": 34.705, "args": { "External id": 19949,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2540 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651162385.718, "dur": 170.811, "args": { "External id": 19950,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651162464.284, "dur": 5.661, "args": { "External id": 19951,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651162472.251, "dur": 2.314, "args": { "External id": 19952,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2543 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651162596.878, "dur": 26.265, "args": { "External id": 19953,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2544 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651162635.887, "dur": 15.566, "args": { "External id": 19954,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162659.924, "dur": 35.833, "args": { "External id": 19955,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162703.092, "dur": 36.412, "args": { "External id": 19956,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162747.529, "dur": 23.742, "args": { "External id": 19957,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162777.475, "dur": 30.715, "args": { "External id": 19958,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162814.810, "dur": 22.640, "args": { "External id": 19959,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651162845.157, "dur": 30.448, "args": { "External id": 19960,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2551 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651162891.337, "dur": 22.447, "args": { "External id": 19961,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2552 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651162940.387, "dur": 29.877, "args": { "External id": 19962,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2553 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651163020.610, "dur": 21.668, "args": { "External id": 19963,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2554 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651163065.017, "dur": 16.572, "args": { "External id": 19964,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2555 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651163095.128, "dur": 16.159, "args": { "External id": 19965,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2556 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163186.745, "dur": 38.973, "args": { "External id": 19966,"Record function id": 0, "Ev Idx": 2557 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163190.065, "dur": 34.831, "args": { "External id": 19967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163194.002, "dur": 29.893, "args": { "External id": 19968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2559 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163218.667, "dur": 5.079, "args": { "External id": 19969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163245.611, "dur": 8.103, "args": { "External id": 19970,"Record function id": 0, "Ev Idx": 2561 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163247.555, "dur": 5.402, "args": { "External id": 19971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163249.012, "dur": 3.058, "args": { "External id": 19972,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2563 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163249.889, "dur": 1.933, "args": { "External id": 19973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2564 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163257.335, "dur": 4.139, "args": { "External id": 19974,"Record function id": 0, "Ev Idx": 2565 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163258.506, "dur": 2.525, "args": { "External id": 19975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163259.022, "dur": 1.566, "args": { "External id": 19976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2567 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163259.307, "dur": 1.200, "args": { "External id": 19977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2568 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163264.688, "dur": 3.572, "args": { "External id": 19978,"Record function id": 0, "Ev Idx": 2569 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163265.725, "dur": 2.138, "args": { "External id": 19979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163266.227, "dur": 1.230, "args": { "External id": 19980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2571 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163266.501, "dur": 0.877, "args": { "External id": 19981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2572 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163271.386, "dur": 4.100, "args": { "External id": 19982,"Record function id": 0, "Ev Idx": 2573 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163272.696, "dur": 2.386, "args": { "External id": 19983,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163273.225, "dur": 1.357, "args": { "External id": 19984,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2575 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163273.533, "dur": 0.987, "args": { "External id": 19985,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2576 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163278.696, "dur": 4.706, "args": { "External id": 19986,"Record function id": 0, "Ev Idx": 2577 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163279.898, "dur": 3.017, "args": { "External id": 19987,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163280.375, "dur": 2.098, "args": { "External id": 19988,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2579 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163281.019, "dur": 1.380, "args": { "External id": 19989,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2580 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163287.366, "dur": 3.667, "args": { "External id": 19990,"Record function id": 0, "Ev Idx": 2581 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163288.623, "dur": 1.984, "args": { "External id": 19991,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163289.150, "dur": 1.054, "args": { "External id": 19992,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2583 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163289.430, "dur": 0.698, "args": { "External id": 19993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2584 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163294.099, "dur": 5.725, "args": { "External id": 19994,"Record function id": 0, "Ev Idx": 2585 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163295.294, "dur": 4.123, "args": { "External id": 19995,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163295.800, "dur": 3.132, "args": { "External id": 19996,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2587 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163298.098, "dur": 0.737, "args": { "External id": 19997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2588 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163302.898, "dur": 3.426, "args": { "External id": 19998,"Record function id": 0, "Ev Idx": 2589 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651163303.953, "dur": 1.932, "args": { "External id": 19999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163304.475, "dur": 1.013, "args": { "External id": 20000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2591 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651163304.755, "dur": 0.657, "args": { "External id": 20001,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2592 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651163310.171, "dur": 38248.418, "args": { "External id": 20002,"Record function id": 0, "Sequence number": 246583, "Fwd thread id": 1, "Ev Idx": 2593 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651163311.451, "dur": 38239.018, "args": { "External id": 20003,"Sequence number": 246583, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2594 } }, { "ph": "f", "id": 185, "pid": 1336757, "tid": 1381170, "ts": 1295651163311.451, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.21)", "pid": 1336757, "tid": 1381170, "ts": 1295651163341.561, "dur": 37.132, "args": { "External id": 20004,"Record function id": 0, "Ev Idx": 2595 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.21)", "pid": 1336757, "tid": 1381170, "ts": 1295651163386.156, "dur": 56.869, "args": { "External id": 20005,"Record function id": 0, "Ev Idx": 2596 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.21)", "pid": 1336757, "tid": 1381170, "ts": 1295651163448.930, "dur": 38093.470, "args": { "External id": 20006,"Record function id": 0, "Ev Idx": 2597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651163534.164, "dur": 6.969, "args": { "External id": 20007,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651163550.144, "dur": 4.872, "args": { "External id": 20008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2599 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651163572.763, "dur": 37134.131, "args": { "External id": 20009,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651163585.571, "dur": 37112.854, "args": { "External id": 20010,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651163632.266, "dur": 14.373, "args": { "External id": 20011,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651163652.789, "dur": 37003.672, "args": { "External id": 20012,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651163655.179, "dur": 37000.544, "args": { "External id": 20013,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651163658.800, "dur": 5.303, "args": { "External id": 20014,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651163666.077, "dur": 36985.882, "args": { "External id": 20015,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651200794.082, "dur": 9.483, "args": { "External id": 20016,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651200797.066, "dur": 6.155, "args": { "External id": 20017,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2608 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651200833.613, "dur": 427.093, "args": { "External id": 20018,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2609 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651200858.963, "dur": 396.076, "args": { "External id": 20019,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2610, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651200869.568, "dur": 378.432, "args": { "External id": 20020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2611 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651201282.464, "dur": 2.962, "args": { "External id": 20021,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2612, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201347.499, "dur": 6.867, "args": { "External id": 20022,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201399.790, "dur": 1.586, "args": { "External id": 20023,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201417.029, "dur": 1.098, "args": { "External id": 20024,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201428.537, "dur": 1.050, "args": { "External id": 20025,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201440.672, "dur": 1.231, "args": { "External id": 20026,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201451.382, "dur": 1.074, "args": { "External id": 20027,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201462.467, "dur": 1.124, "args": { "External id": 20028,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201474.249, "dur": 2.087, "args": { "External id": 20029,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201485.368, "dur": 1.103, "args": { "External id": 20030,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2621 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651201572.400, "dur": 2676.489, "args": { "External id": 20031,"Record function id": 0, "Ev Idx": 2622 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.20)", "pid": 1336757, "tid": 1381170, "ts": 1295651201590.064, "dur": 989.848, "args": { "External id": 20032,"Record function id": 0, "Ev Idx": 2623 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.20)", "pid": 1336757, "tid": 1381170, "ts": 1295651201604.295, "dur": 307.252, "args": { "External id": 20033,"Record function id": 0, "Ev Idx": 2624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201676.975, "dur": 4.023, "args": { "External id": 20034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201683.996, "dur": 1.989, "args": { "External id": 20035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201687.642, "dur": 1.394, "args": { "External id": 20036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201690.383, "dur": 1.400, "args": { "External id": 20037,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201693.342, "dur": 1.460, "args": { "External id": 20038,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201696.235, "dur": 1.308, "args": { "External id": 20039,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201699.523, "dur": 2.827, "args": { "External id": 20040,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201703.601, "dur": 1.319, "args": { "External id": 20041,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201706.568, "dur": 1.403, "args": { "External id": 20042,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651201709.404, "dur": 1.123, "args": { "External id": 20043,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2634 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651201727.451, "dur": 153.363, "args": { "External id": 20044,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651201742.334, "dur": 134.330, "args": { "External id": 20045,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651201760.423, "dur": 11.364, "args": { "External id": 20046,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651201774.911, "dur": 66.527, "args": { "External id": 20047,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651201777.620, "dur": 63.469, "args": { "External id": 20048,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651201781.422, "dur": 7.187, "args": { "External id": 20049,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651201790.606, "dur": 49.814, "args": { "External id": 20050,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2641 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.19", "pid": 1336757, "tid": 1381170, "ts": 1295651201978.960, "dur": 592.486, "args": { "External id": 20051,"Record function id": 0, "Ev Idx": 2642 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 1336757, "tid": 1381170, "ts": 1295651202035.478, "dur": 523.590, "args": { "External id": 20052,"Record function id": 0, "Ev Idx": 2643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651202093.298, "dur": 6.454, "args": { "External id": 20053,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651202115.936, "dur": 32.100, "args": { "External id": 20054,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202120.547, "dur": 2.570, "args": { "External id": 20055,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202125.244, "dur": 0.940, "args": { "External id": 20056,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202127.730, "dur": 0.856, "args": { "External id": 20057,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202129.959, "dur": 0.538, "args": { "External id": 20058,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202132.096, "dur": 0.713, "args": { "External id": 20059,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202134.647, "dur": 0.820, "args": { "External id": 20060,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202136.977, "dur": 0.937, "args": { "External id": 20061,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202139.491, "dur": 0.541, "args": { "External id": 20062,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202141.456, "dur": 0.650, "args": { "External id": 20063,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651202157.764, "dur": 32.348, "args": { "External id": 20064,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2655 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651202221.488, "dur": 126.939, "args": { "External id": 20065,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651202247.607, "dur": 4.390, "args": { "External id": 20066,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651202257.785, "dur": 11.469, "args": { "External id": 20067,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651202262.017, "dur": 6.795, "args": { "External id": 20068,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202265.868, "dur": 1.155, "args": { "External id": 20069,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651202277.241, "dur": 29.192, "args": { "External id": 20070,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202279.929, "dur": 0.753, "args": { "External id": 20071,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202282.613, "dur": 0.801, "args": { "External id": 20072,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202284.976, "dur": 0.704, "args": { "External id": 20073,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202287.501, "dur": 0.789, "args": { "External id": 20074,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202289.883, "dur": 0.885, "args": { "External id": 20075,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202292.382, "dur": 0.909, "args": { "External id": 20076,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202294.881, "dur": 1.004, "args": { "External id": 20077,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202297.195, "dur": 0.797, "args": { "External id": 20078,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651202299.688, "dur": 1.183, "args": { "External id": 20079,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651202318.393, "dur": 21.474, "args": { "External id": 20080,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2671 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651202393.949, "dur": 104.618, "args": { "External id": 20081,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2672 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651202414.330, "dur": 80.697, "args": { "External id": 20082,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2673, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651202423.725, "dur": 66.852, "args": { "External id": 20083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2674 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651202510.196, "dur": 1.771, "args": { "External id": 20084,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2675, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651202586.536, "dur": 1627.943, "args": { "External id": 20085,"Sequence number": 246582, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2676 } }, { "ph": "f", "id": 186, "pid": 1336757, "tid": 1381170, "ts": 1295651202586.536, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651202690.286, "dur": 99.245, "args": { "External id": 20086,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2677 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651202824.689, "dur": 38.970, "args": { "External id": 20087,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651202881.546, "dur": 49.786, "args": { "External id": 20088,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651202941.390, "dur": 35.295, "args": { "External id": 20089,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203025.925, "dur": 53.152, "args": { "External id": 20090,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203089.547, "dur": 29.960, "args": { "External id": 20091,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203127.736, "dur": 42.749, "args": { "External id": 20092,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2683 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651203195.932, "dur": 24.424, "args": { "External id": 20093,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2684 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651203254.513, "dur": 30.925, "args": { "External id": 20094,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2685 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651203305.382, "dur": 20.607, "args": { "External id": 20095,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2686 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651203339.080, "dur": 16.954, "args": { "External id": 20096,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203366.007, "dur": 35.888, "args": { "External id": 20097,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203405.192, "dur": 36.725, "args": { "External id": 20098,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2689 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651203470.681, "dur": 170.063, "args": { "External id": 20099,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651203548.627, "dur": 5.863, "args": { "External id": 20100,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651203556.521, "dur": 2.137, "args": { "External id": 20101,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2692 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651203670.991, "dur": 25.308, "args": { "External id": 20102,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2693 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651203707.039, "dur": 15.095, "args": { "External id": 20103,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203730.606, "dur": 35.270, "args": { "External id": 20104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203772.541, "dur": 36.920, "args": { "External id": 20105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203816.976, "dur": 23.440, "args": { "External id": 20106,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203846.680, "dur": 30.227, "args": { "External id": 20107,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203883.238, "dur": 21.606, "args": { "External id": 20108,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651203912.596, "dur": 30.295, "args": { "External id": 20109,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2700 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651203958.655, "dur": 23.416, "args": { "External id": 20110,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2701 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651204035.329, "dur": 42.353, "args": { "External id": 20111,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2702 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651204098.001, "dur": 19.037, "args": { "External id": 20112,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2703 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651204133.001, "dur": 20.215, "args": { "External id": 20113,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2704 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651204166.426, "dur": 16.756, "args": { "External id": 20114,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2705 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204272.095, "dur": 16.813, "args": { "External id": 20115,"Record function id": 0, "Ev Idx": 2706 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204275.776, "dur": 12.099, "args": { "External id": 20116,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204280.064, "dur": 6.599, "args": { "External id": 20117,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2708 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204282.069, "dur": 4.511, "args": { "External id": 20118,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2709 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204292.801, "dur": 4.725, "args": { "External id": 20119,"Record function id": 0, "Ev Idx": 2710 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204294.174, "dur": 2.885, "args": { "External id": 20120,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204294.919, "dur": 1.705, "args": { "External id": 20121,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2712 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204295.479, "dur": 1.057, "args": { "External id": 20122,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2713 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204300.789, "dur": 5.459, "args": { "External id": 20123,"Record function id": 0, "Ev Idx": 2714 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204302.841, "dur": 2.939, "args": { "External id": 20124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204303.841, "dur": 1.536, "args": { "External id": 20125,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2716 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204304.267, "dur": 1.040, "args": { "External id": 20126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2717 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204309.415, "dur": 4.240, "args": { "External id": 20127,"Record function id": 0, "Ev Idx": 2718 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204310.476, "dur": 2.707, "args": { "External id": 20128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204311.101, "dur": 1.682, "args": { "External id": 20129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2720 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204311.752, "dur": 0.899, "args": { "External id": 20130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204316.838, "dur": 3.853, "args": { "External id": 20131,"Record function id": 0, "Ev Idx": 2722 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204318.143, "dur": 2.099, "args": { "External id": 20132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204318.826, "dur": 0.981, "args": { "External id": 20133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2724 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204319.113, "dur": 0.622, "args": { "External id": 20134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2725 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204323.920, "dur": 3.639, "args": { "External id": 20135,"Record function id": 0, "Ev Idx": 2726 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204324.966, "dur": 2.125, "args": { "External id": 20136,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204325.606, "dur": 1.098, "args": { "External id": 20137,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2728 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204325.892, "dur": 0.693, "args": { "External id": 20138,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2729 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204330.930, "dur": 4.294, "args": { "External id": 20139,"Record function id": 0, "Ev Idx": 2730 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204332.119, "dur": 2.687, "args": { "External id": 20140,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204332.753, "dur": 1.639, "args": { "External id": 20141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2732 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204333.432, "dur": 0.852, "args": { "External id": 20142,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2733 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204338.304, "dur": 3.953, "args": { "External id": 20143,"Record function id": 0, "Ev Idx": 2734 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204339.536, "dur": 2.296, "args": { "External id": 20144,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204340.097, "dur": 1.267, "args": { "External id": 20145,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2736 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204340.465, "dur": 0.837, "args": { "External id": 20146,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2737 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204345.375, "dur": 3.691, "args": { "External id": 20147,"Record function id": 0, "Ev Idx": 2738 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651204346.319, "dur": 2.296, "args": { "External id": 20148,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204346.817, "dur": 1.387, "args": { "External id": 20149,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2740 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651204347.108, "dur": 1.004, "args": { "External id": 20150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2741 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651204352.472, "dur": 35558.743, "args": { "External id": 20151,"Record function id": 0, "Sequence number": 246581, "Fwd thread id": 1, "Ev Idx": 2742 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651204353.628, "dur": 35549.494, "args": { "External id": 20152,"Sequence number": 246581, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2743 } }, { "ph": "f", "id": 187, "pid": 1336757, "tid": 1381170, "ts": 1295651204353.628, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.20)", "pid": 1336757, "tid": 1381170, "ts": 1295651204382.138, "dur": 36.661, "args": { "External id": 20153,"Record function id": 0, "Ev Idx": 2744 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.20)", "pid": 1336757, "tid": 1381170, "ts": 1295651204426.607, "dur": 57.397, "args": { "External id": 20154,"Record function id": 0, "Ev Idx": 2745 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.20)", "pid": 1336757, "tid": 1381170, "ts": 1295651204491.090, "dur": 35404.870, "args": { "External id": 20155,"Record function id": 0, "Ev Idx": 2746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651204576.617, "dur": 6.345, "args": { "External id": 20156,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651204591.942, "dur": 4.716, "args": { "External id": 20157,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2748 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651204610.641, "dur": 34537.584, "args": { "External id": 20158,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651204623.315, "dur": 34515.649, "args": { "External id": 20159,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651204690.691, "dur": 13.262, "args": { "External id": 20160,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651204710.211, "dur": 34389.378, "args": { "External id": 20161,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651204712.928, "dur": 34385.540, "args": { "External id": 20162,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651204716.701, "dur": 5.063, "args": { "External id": 20163,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651204723.652, "dur": 34371.088, "args": { "External id": 20164,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651239250.546, "dur": 10.632, "args": { "External id": 20165,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651239254.215, "dur": 6.470, "args": { "External id": 20166,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2757 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651239294.687, "dur": 334.892, "args": { "External id": 20167,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2758 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651239323.370, "dur": 301.535, "args": { "External id": 20168,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2759, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651239335.057, "dur": 284.689, "args": { "External id": 20169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2760 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651239647.517, "dur": 2.179, "args": { "External id": 20170,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2761, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239704.310, "dur": 6.602, "args": { "External id": 20171,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239753.600, "dur": 1.639, "args": { "External id": 20172,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239771.093, "dur": 0.771, "args": { "External id": 20173,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239782.576, "dur": 1.316, "args": { "External id": 20174,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239794.916, "dur": 0.699, "args": { "External id": 20175,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239805.324, "dur": 0.850, "args": { "External id": 20176,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239816.367, "dur": 0.854, "args": { "External id": 20177,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239827.933, "dur": 2.081, "args": { "External id": 20178,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651239839.099, "dur": 0.816, "args": { "External id": 20179,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2770 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651239924.787, "dur": 2711.035, "args": { "External id": 20180,"Record function id": 0, "Ev Idx": 2771 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.19)", "pid": 1336757, "tid": 1381170, "ts": 1295651239942.868, "dur": 993.236, "args": { "External id": 20181,"Record function id": 0, "Ev Idx": 2772 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 1336757, "tid": 1381170, "ts": 1295651239956.591, "dur": 384.208, "args": { "External id": 20182,"Record function id": 0, "Ev Idx": 2773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240081.985, "dur": 4.798, "args": { "External id": 20183,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240090.098, "dur": 1.274, "args": { "External id": 20184,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240093.097, "dur": 1.005, "args": { "External id": 20185,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240096.234, "dur": 0.985, "args": { "External id": 20186,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240098.635, "dur": 1.178, "args": { "External id": 20187,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240103.829, "dur": 0.762, "args": { "External id": 20188,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240106.136, "dur": 2.651, "args": { "External id": 20189,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240111.877, "dur": 0.733, "args": { "External id": 20190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240114.227, "dur": 1.142, "args": { "External id": 20191,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651240116.603, "dur": 1.029, "args": { "External id": 20192,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2783 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651240135.663, "dur": 167.276, "args": { "External id": 20193,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651240152.322, "dur": 146.227, "args": { "External id": 20194,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651240167.697, "dur": 13.061, "args": { "External id": 20195,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651240184.081, "dur": 82.531, "args": { "External id": 20196,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651240186.687, "dur": 79.572, "args": { "External id": 20197,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240190.579, "dur": 5.017, "args": { "External id": 20198,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651240197.672, "dur": 67.530, "args": { "External id": 20199,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2790 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.18", "pid": 1336757, "tid": 1381170, "ts": 1295651240419.886, "dur": 508.673, "args": { "External id": 20200,"Record function id": 0, "Ev Idx": 2791 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 1336757, "tid": 1381170, "ts": 1295651240438.551, "dur": 478.286, "args": { "External id": 20201,"Record function id": 0, "Ev Idx": 2792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651240495.215, "dur": 5.700, "args": { "External id": 20202,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651240516.047, "dur": 29.502, "args": { "External id": 20203,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240521.017, "dur": 1.651, "args": { "External id": 20204,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240524.760, "dur": 0.608, "args": { "External id": 20205,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240527.195, "dur": 0.325, "args": { "External id": 20206,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240528.959, "dur": 0.285, "args": { "External id": 20207,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240531.020, "dur": 0.380, "args": { "External id": 20208,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240532.945, "dur": 0.225, "args": { "External id": 20209,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240534.939, "dur": 0.258, "args": { "External id": 20210,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240536.746, "dur": 0.499, "args": { "External id": 20211,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240538.921, "dur": 0.451, "args": { "External id": 20212,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651240554.937, "dur": 28.882, "args": { "External id": 20213,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2804 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651240614.458, "dur": 92.665, "args": { "External id": 20214,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651240624.456, "dur": 3.396, "args": { "External id": 20215,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651240632.679, "dur": 9.711, "args": { "External id": 20216,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651240636.625, "dur": 5.370, "args": { "External id": 20217,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240640.020, "dur": 0.514, "args": { "External id": 20218,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651240648.356, "dur": 23.777, "args": { "External id": 20219,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240650.108, "dur": 0.399, "args": { "External id": 20220,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240652.165, "dur": 0.515, "args": { "External id": 20221,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240654.206, "dur": 0.748, "args": { "External id": 20222,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240656.496, "dur": 0.331, "args": { "External id": 20223,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240658.289, "dur": 0.412, "args": { "External id": 20224,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240660.359, "dur": 0.479, "args": { "External id": 20225,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240662.432, "dur": 0.307, "args": { "External id": 20226,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240664.616, "dur": 0.463, "args": { "External id": 20227,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651240666.773, "dur": 0.255, "args": { "External id": 20228,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651240681.472, "dur": 17.610, "args": { "External id": 20229,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2820 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651240750.057, "dur": 104.162, "args": { "External id": 20230,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2821 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651240771.157, "dur": 79.648, "args": { "External id": 20231,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2822, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651240780.206, "dur": 66.682, "args": { "External id": 20232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2823 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651240868.759, "dur": 1.927, "args": { "External id": 20233,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2824, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651240943.644, "dur": 1671.989, "args": { "External id": 20234,"Sequence number": 246580, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2825 } }, { "ph": "f", "id": 188, "pid": 1336757, "tid": 1381170, "ts": 1295651240943.644, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651241103.274, "dur": 104.187, "args": { "External id": 20235,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2826 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651241263.029, "dur": 42.287, "args": { "External id": 20236,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651241323.308, "dur": 53.398, "args": { "External id": 20237,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651241385.603, "dur": 33.419, "args": { "External id": 20238,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651241425.029, "dur": 45.312, "args": { "External id": 20239,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651241477.435, "dur": 27.930, "args": { "External id": 20240,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651241512.374, "dur": 42.117, "args": { "External id": 20241,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2832 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651241582.631, "dur": 24.236, "args": { "External id": 20242,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2833 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651241624.597, "dur": 28.479, "args": { "External id": 20243,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2834 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651241674.955, "dur": 20.293, "args": { "External id": 20244,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2835 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651241709.800, "dur": 16.303, "args": { "External id": 20245,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651241735.939, "dur": 30.806, "args": { "External id": 20246,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651241769.799, "dur": 33.309, "args": { "External id": 20247,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2838 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651241831.118, "dur": 209.504, "args": { "External id": 20248,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651241908.426, "dur": 6.649, "args": { "External id": 20249,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651241917.075, "dur": 3.071, "args": { "External id": 20250,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2841 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651242073.906, "dur": 28.741, "args": { "External id": 20251,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2842 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651242114.632, "dur": 15.954, "args": { "External id": 20252,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651242140.818, "dur": 42.389, "args": { "External id": 20253,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651242189.219, "dur": 35.685, "args": { "External id": 20254,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651242249.502, "dur": 27.323, "args": { "External id": 20255,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651242281.505, "dur": 30.272, "args": { "External id": 20256,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651242318.841, "dur": 22.050, "args": { "External id": 20257,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651242347.576, "dur": 29.123, "args": { "External id": 20258,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2849 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651242396.370, "dur": 26.191, "args": { "External id": 20259,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2850 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651242451.133, "dur": 31.257, "args": { "External id": 20260,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2851 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651242499.350, "dur": 17.951, "args": { "External id": 20261,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2852 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651242534.004, "dur": 20.028, "args": { "External id": 20262,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2853 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651242568.156, "dur": 16.349, "args": { "External id": 20263,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2854 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242657.766, "dur": 15.578, "args": { "External id": 20264,"Record function id": 0, "Ev Idx": 2855 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242661.348, "dur": 10.942, "args": { "External id": 20265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242665.460, "dur": 6.010, "args": { "External id": 20266,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2857 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242666.864, "dur": 4.508, "args": { "External id": 20267,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2858 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242677.582, "dur": 4.691, "args": { "External id": 20268,"Record function id": 0, "Ev Idx": 2859 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242678.746, "dur": 3.024, "args": { "External id": 20269,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242679.306, "dur": 1.982, "args": { "External id": 20270,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2861 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242680.107, "dur": 1.113, "args": { "External id": 20271,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2862 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242685.553, "dur": 4.200, "args": { "External id": 20272,"Record function id": 0, "Ev Idx": 2863 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242686.599, "dur": 2.638, "args": { "External id": 20273,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242687.275, "dur": 1.521, "args": { "External id": 20274,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2865 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242687.940, "dur": 0.738, "args": { "External id": 20275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2866 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242693.099, "dur": 4.679, "args": { "External id": 20276,"Record function id": 0, "Ev Idx": 2867 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242694.378, "dur": 2.940, "args": { "External id": 20277,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242695.141, "dur": 1.783, "args": { "External id": 20278,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2869 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242695.843, "dur": 0.975, "args": { "External id": 20279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2870 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242700.841, "dur": 4.231, "args": { "External id": 20280,"Record function id": 0, "Ev Idx": 2871 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242702.059, "dur": 2.584, "args": { "External id": 20281,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242702.814, "dur": 1.412, "args": { "External id": 20282,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2873 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242703.337, "dur": 0.823, "args": { "External id": 20283,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2874 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242708.310, "dur": 3.720, "args": { "External id": 20284,"Record function id": 0, "Ev Idx": 2875 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242709.377, "dur": 2.189, "args": { "External id": 20285,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242709.842, "dur": 1.300, "args": { "External id": 20286,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2877 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242710.268, "dur": 0.775, "args": { "External id": 20287,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2878 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242715.118, "dur": 3.627, "args": { "External id": 20288,"Record function id": 0, "Ev Idx": 2879 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242716.101, "dur": 2.209, "args": { "External id": 20289,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242716.571, "dur": 1.343, "args": { "External id": 20290,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2881 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242716.975, "dur": 0.868, "args": { "External id": 20291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2882 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242721.972, "dur": 3.957, "args": { "External id": 20292,"Record function id": 0, "Ev Idx": 2883 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242723.058, "dur": 2.431, "args": { "External id": 20293,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242723.780, "dur": 1.296, "args": { "External id": 20294,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2885 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242724.161, "dur": 0.842, "args": { "External id": 20295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2886 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242729.093, "dur": 3.641, "args": { "External id": 20296,"Record function id": 0, "Ev Idx": 2887 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651242730.138, "dur": 2.156, "args": { "External id": 20297,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242730.619, "dur": 1.223, "args": { "External id": 20298,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2889 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651242731.145, "dur": 0.624, "args": { "External id": 20299,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2890 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651242736.186, "dur": 36017.298, "args": { "External id": 20300,"Record function id": 0, "Sequence number": 246579, "Fwd thread id": 1, "Ev Idx": 2891 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651242737.273, "dur": 36007.781, "args": { "External id": 20301,"Sequence number": 246579, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2892 } }, { "ph": "f", "id": 189, "pid": 1336757, "tid": 1381170, "ts": 1295651242737.273, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.19)", "pid": 1336757, "tid": 1381170, "ts": 1295651242764.551, "dur": 35.222, "args": { "External id": 20302,"Record function id": 0, "Ev Idx": 2893 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.19)", "pid": 1336757, "tid": 1381170, "ts": 1295651242807.057, "dur": 57.490, "args": { "External id": 20303,"Record function id": 0, "Ev Idx": 2894 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.19)", "pid": 1336757, "tid": 1381170, "ts": 1295651242870.361, "dur": 35866.250, "args": { "External id": 20304,"Record function id": 0, "Ev Idx": 2895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651242959.316, "dur": 6.707, "args": { "External id": 20305,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651242974.918, "dur": 4.565, "args": { "External id": 20306,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2897 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651243033.007, "dur": 34916.723, "args": { "External id": 20307,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651243046.530, "dur": 34894.099, "args": { "External id": 20308,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651243104.004, "dur": 14.243, "args": { "External id": 20309,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651243124.408, "dur": 34776.459, "args": { "External id": 20310,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651243127.165, "dur": 34772.814, "args": { "External id": 20311,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651243131.549, "dur": 5.750, "args": { "External id": 20312,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651243139.000, "dur": 34756.964, "args": { "External id": 20313,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651278069.457, "dur": 12.208, "args": { "External id": 20314,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651278074.161, "dur": 6.895, "args": { "External id": 20315,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2906 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651278110.383, "dur": 354.913, "args": { "External id": 20316,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2907 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651278138.030, "dur": 322.414, "args": { "External id": 20317,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2908, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651278149.347, "dur": 305.278, "args": { "External id": 20318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2909 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651278485.443, "dur": 2.152, "args": { "External id": 20319,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2910, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278543.332, "dur": 6.859, "args": { "External id": 20320,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278593.094, "dur": 1.791, "args": { "External id": 20321,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278610.239, "dur": 1.175, "args": { "External id": 20322,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278622.844, "dur": 0.983, "args": { "External id": 20323,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278633.625, "dur": 0.916, "args": { "External id": 20324,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278643.613, "dur": 1.123, "args": { "External id": 20325,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278654.232, "dur": 1.065, "args": { "External id": 20326,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278665.998, "dur": 1.587, "args": { "External id": 20327,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278677.084, "dur": 1.023, "args": { "External id": 20328,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2919 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651278766.692, "dur": 2685.461, "args": { "External id": 20329,"Record function id": 0, "Ev Idx": 2920 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.18)", "pid": 1336757, "tid": 1381170, "ts": 1295651278785.280, "dur": 997.089, "args": { "External id": 20330,"Record function id": 0, "Ev Idx": 2921 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 1336757, "tid": 1381170, "ts": 1295651278798.524, "dur": 351.684, "args": { "External id": 20331,"Record function id": 0, "Ev Idx": 2922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278872.227, "dur": 4.116, "args": { "External id": 20332,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278879.752, "dur": 1.115, "args": { "External id": 20333,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278884.710, "dur": 1.087, "args": { "External id": 20334,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278887.088, "dur": 0.911, "args": { "External id": 20335,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278889.345, "dur": 0.781, "args": { "External id": 20336,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278891.461, "dur": 0.869, "args": { "External id": 20337,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278895.974, "dur": 1.224, "args": { "External id": 20338,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278898.594, "dur": 0.577, "args": { "External id": 20339,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278900.632, "dur": 0.959, "args": { "External id": 20340,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651278902.878, "dur": 0.763, "args": { "External id": 20341,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2932 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651278923.104, "dur": 194.877, "args": { "External id": 20342,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651278938.107, "dur": 174.801, "args": { "External id": 20343,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651278954.528, "dur": 11.852, "args": { "External id": 20344,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651278969.248, "dur": 115.108, "args": { "External id": 20345,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651278971.752, "dur": 112.190, "args": { "External id": 20346,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651278975.449, "dur": 5.385, "args": { "External id": 20347,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651279031.815, "dur": 51.274, "args": { "External id": 20348,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2939 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.17", "pid": 1336757, "tid": 1381170, "ts": 1295651279245.031, "dur": 529.949, "args": { "External id": 20349,"Record function id": 0, "Ev Idx": 2940 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 1336757, "tid": 1381170, "ts": 1295651279264.463, "dur": 498.697, "args": { "External id": 20350,"Record function id": 0, "Ev Idx": 2941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651279320.293, "dur": 6.786, "args": { "External id": 20351,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651279342.753, "dur": 29.669, "args": { "External id": 20352,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279347.473, "dur": 2.263, "args": { "External id": 20353,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279351.964, "dur": 0.471, "args": { "External id": 20354,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279354.112, "dur": 0.289, "args": { "External id": 20355,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279355.928, "dur": 0.564, "args": { "External id": 20356,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279357.593, "dur": 0.669, "args": { "External id": 20357,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279359.475, "dur": 0.222, "args": { "External id": 20358,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279363.842, "dur": 0.448, "args": { "External id": 20359,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279365.775, "dur": 0.300, "args": { "External id": 20360,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279367.651, "dur": 0.258, "args": { "External id": 20361,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651279382.091, "dur": 31.851, "args": { "External id": 20362,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2953 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651279447.734, "dur": 93.882, "args": { "External id": 20363,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651279457.840, "dur": 3.500, "args": { "External id": 20364,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651279466.430, "dur": 9.958, "args": { "External id": 20365,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651279470.643, "dur": 5.331, "args": { "External id": 20366,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279474.064, "dur": 0.688, "args": { "External id": 20367,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651279482.494, "dur": 18.500, "args": { "External id": 20368,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279484.566, "dur": 0.551, "args": { "External id": 20369,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279486.533, "dur": 0.481, "args": { "External id": 20370,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279488.140, "dur": 0.248, "args": { "External id": 20371,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279489.578, "dur": 0.326, "args": { "External id": 20372,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279491.281, "dur": 0.237, "args": { "External id": 20373,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279492.618, "dur": 0.475, "args": { "External id": 20374,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279494.193, "dur": 0.317, "args": { "External id": 20375,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279495.624, "dur": 0.270, "args": { "External id": 20376,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651279497.305, "dur": 0.248, "args": { "External id": 20377,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651279514.485, "dur": 19.277, "args": { "External id": 20378,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2969 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651279585.115, "dur": 111.194, "args": { "External id": 20379,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2970 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651279613.586, "dur": 79.219, "args": { "External id": 20380,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2971, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651279622.567, "dur": 66.291, "args": { "External id": 20381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2972 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651279714.982, "dur": 2.047, "args": { "External id": 20382,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2973, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651279789.565, "dur": 1638.334, "args": { "External id": 20383,"Sequence number": 246578, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2974 } }, { "ph": "f", "id": 190, "pid": 1336757, "tid": 1381170, "ts": 1295651279789.565, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651279893.582, "dur": 153.894, "args": { "External id": 20384,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2975 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651280092.917, "dur": 39.797, "args": { "External id": 20385,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651280149.418, "dur": 55.345, "args": { "External id": 20386,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280215.137, "dur": 50.609, "args": { "External id": 20387,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280275.224, "dur": 47.421, "args": { "External id": 20388,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280329.865, "dur": 27.702, "args": { "External id": 20389,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280364.875, "dur": 41.635, "args": { "External id": 20390,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2981 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651280432.492, "dur": 24.598, "args": { "External id": 20391,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2982 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651280474.665, "dur": 26.429, "args": { "External id": 20392,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2983 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651280523.190, "dur": 19.454, "args": { "External id": 20393,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2984 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651280555.018, "dur": 15.293, "args": { "External id": 20394,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280579.541, "dur": 28.994, "args": { "External id": 20395,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280611.918, "dur": 31.889, "args": { "External id": 20396,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2987 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651280668.984, "dur": 165.395, "args": { "External id": 20397,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651280746.589, "dur": 5.896, "args": { "External id": 20398,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651280754.145, "dur": 2.260, "args": { "External id": 20399,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2990 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651280861.668, "dur": 23.525, "args": { "External id": 20400,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2991 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651280898.102, "dur": 15.539, "args": { "External id": 20401,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280922.126, "dur": 34.975, "args": { "External id": 20402,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651280962.763, "dur": 71.796, "args": { "External id": 20403,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651281045.728, "dur": 26.013, "args": { "External id": 20404,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651281076.132, "dur": 31.805, "args": { "External id": 20405,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651281113.820, "dur": 21.778, "args": { "External id": 20406,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651281141.699, "dur": 29.096, "args": { "External id": 20407,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2998 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651281190.619, "dur": 23.823, "args": { "External id": 20408,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2999 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651281245.654, "dur": 45.260, "args": { "External id": 20409,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3000 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651281314.857, "dur": 19.713, "args": { "External id": 20410,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3001 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651281352.425, "dur": 16.152, "args": { "External id": 20411,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3002 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651281384.197, "dur": 17.156, "args": { "External id": 20412,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3003 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281474.293, "dur": 18.046, "args": { "External id": 20413,"Record function id": 0, "Ev Idx": 3004 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281477.635, "dur": 13.681, "args": { "External id": 20414,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281481.688, "dur": 8.805, "args": { "External id": 20415,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3006 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281483.157, "dur": 7.245, "args": { "External id": 20416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3007 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281496.198, "dur": 4.577, "args": { "External id": 20417,"Record function id": 0, "Ev Idx": 3008 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281497.371, "dur": 2.932, "args": { "External id": 20418,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281498.339, "dur": 1.518, "args": { "External id": 20419,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3010 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281499.019, "dur": 0.768, "args": { "External id": 20420,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3011 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281504.192, "dur": 4.864, "args": { "External id": 20421,"Record function id": 0, "Ev Idx": 3012 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281505.670, "dur": 2.921, "args": { "External id": 20422,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281506.314, "dur": 1.888, "args": { "External id": 20423,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3014 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281507.119, "dur": 0.986, "args": { "External id": 20424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3015 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281512.176, "dur": 3.719, "args": { "External id": 20425,"Record function id": 0, "Ev Idx": 3016 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281513.114, "dur": 2.328, "args": { "External id": 20426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281513.710, "dur": 1.332, "args": { "External id": 20427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3018 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281514.202, "dur": 0.724, "args": { "External id": 20428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3019 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281518.954, "dur": 3.883, "args": { "External id": 20429,"Record function id": 0, "Ev Idx": 3020 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281519.963, "dur": 2.438, "args": { "External id": 20430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281520.569, "dur": 1.404, "args": { "External id": 20431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3022 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281520.990, "dur": 0.916, "args": { "External id": 20432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3023 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281525.970, "dur": 3.333, "args": { "External id": 20433,"Record function id": 0, "Ev Idx": 3024 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281526.825, "dur": 2.048, "args": { "External id": 20434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281527.341, "dur": 1.115, "args": { "External id": 20435,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3026 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281527.807, "dur": 0.575, "args": { "External id": 20436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3027 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281532.619, "dur": 3.670, "args": { "External id": 20437,"Record function id": 0, "Ev Idx": 3028 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281533.638, "dur": 2.199, "args": { "External id": 20438,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281534.297, "dur": 1.112, "args": { "External id": 20439,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3030 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281534.572, "dur": 0.771, "args": { "External id": 20440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3031 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281539.302, "dur": 3.453, "args": { "External id": 20441,"Record function id": 0, "Ev Idx": 3032 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281540.410, "dur": 1.929, "args": { "External id": 20442,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281540.883, "dur": 1.052, "args": { "External id": 20443,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3034 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281541.156, "dur": 0.713, "args": { "External id": 20444,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3035 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281545.782, "dur": 5.549, "args": { "External id": 20445,"Record function id": 0, "Ev Idx": 3036 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651281547.228, "dur": 3.662, "args": { "External id": 20446,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281547.707, "dur": 2.782, "args": { "External id": 20447,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3038 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651281549.723, "dur": 0.661, "args": { "External id": 20448,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3039 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651281554.875, "dur": 36338.899, "args": { "External id": 20449,"Record function id": 0, "Sequence number": 246577, "Fwd thread id": 1, "Ev Idx": 3040 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651281556.067, "dur": 36329.549, "args": { "External id": 20450,"Sequence number": 246577, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3041 } }, { "ph": "f", "id": 191, "pid": 1336757, "tid": 1381170, "ts": 1295651281556.067, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.18)", "pid": 1336757, "tid": 1381170, "ts": 1295651281583.188, "dur": 36.733, "args": { "External id": 20451,"Record function id": 0, "Ev Idx": 3042 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.18)", "pid": 1336757, "tid": 1381170, "ts": 1295651281626.824, "dur": 54.745, "args": { "External id": 20452,"Record function id": 0, "Ev Idx": 3043 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.18)", "pid": 1336757, "tid": 1381170, "ts": 1295651281686.677, "dur": 36191.318, "args": { "External id": 20453,"Record function id": 0, "Ev Idx": 3044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651281769.560, "dur": 6.380, "args": { "External id": 20454,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651281784.070, "dur": 4.364, "args": { "External id": 20455,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3046 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651281802.374, "dur": 35253.431, "args": { "External id": 20456,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651281822.510, "dur": 35224.318, "args": { "External id": 20457,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651281869.679, "dur": 13.417, "args": { "External id": 20458,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651281888.919, "dur": 35118.345, "args": { "External id": 20459,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651281891.643, "dur": 35114.721, "args": { "External id": 20460,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651281895.786, "dur": 5.279, "args": { "External id": 20461,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651281902.756, "dur": 35077.469, "args": { "External id": 20462,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651317149.665, "dur": 10.098, "args": { "External id": 20463,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651317152.765, "dur": 6.641, "args": { "External id": 20464,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3055 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651317188.167, "dur": 406.443, "args": { "External id": 20465,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3056 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651317219.610, "dur": 369.810, "args": { "External id": 20466,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3057, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651317241.893, "dur": 341.931, "args": { "External id": 20467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3058 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651317618.517, "dur": 2.419, "args": { "External id": 20468,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3059, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317681.989, "dur": 6.897, "args": { "External id": 20469,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317731.973, "dur": 1.594, "args": { "External id": 20470,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317748.729, "dur": 1.333, "args": { "External id": 20471,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317762.305, "dur": 1.127, "args": { "External id": 20472,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317773.519, "dur": 0.842, "args": { "External id": 20473,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317783.816, "dur": 0.846, "args": { "External id": 20474,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317796.440, "dur": 1.054, "args": { "External id": 20475,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317807.511, "dur": 1.941, "args": { "External id": 20476,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651317818.464, "dur": 1.068, "args": { "External id": 20477,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3068 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651317907.515, "dur": 2691.407, "args": { "External id": 20478,"Record function id": 0, "Ev Idx": 3069 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.17)", "pid": 1336757, "tid": 1381170, "ts": 1295651317926.199, "dur": 1015.115, "args": { "External id": 20479,"Record function id": 0, "Ev Idx": 3070 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 1336757, "tid": 1381170, "ts": 1295651317941.225, "dur": 394.727, "args": { "External id": 20480,"Record function id": 0, "Ev Idx": 3071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318090.387, "dur": 5.419, "args": { "External id": 20481,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318099.489, "dur": 0.892, "args": { "External id": 20482,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318103.801, "dur": 0.880, "args": { "External id": 20483,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318106.212, "dur": 0.762, "args": { "External id": 20484,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318108.249, "dur": 0.905, "args": { "External id": 20485,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318110.693, "dur": 0.888, "args": { "External id": 20486,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318114.827, "dur": 1.456, "args": { "External id": 20487,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318117.614, "dur": 0.842, "args": { "External id": 20488,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318119.608, "dur": 0.843, "args": { "External id": 20489,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651318121.845, "dur": 0.891, "args": { "External id": 20490,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3081 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651318144.671, "dur": 156.874, "args": { "External id": 20491,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651318160.388, "dur": 136.295, "args": { "External id": 20492,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651318174.168, "dur": 12.045, "args": { "External id": 20493,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651318188.964, "dur": 79.571, "args": { "External id": 20494,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651318191.226, "dur": 76.980, "args": { "External id": 20495,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318195.283, "dur": 5.123, "args": { "External id": 20496,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651318201.910, "dur": 65.242, "args": { "External id": 20497,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3088 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.16", "pid": 1336757, "tid": 1381170, "ts": 1295651318418.008, "dur": 515.939, "args": { "External id": 20498,"Record function id": 0, "Ev Idx": 3089 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 1336757, "tid": 1381170, "ts": 1295651318433.807, "dur": 488.433, "args": { "External id": 20499,"Record function id": 0, "Ev Idx": 3090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651318488.811, "dur": 5.026, "args": { "External id": 20500,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651318510.305, "dur": 25.040, "args": { "External id": 20501,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318515.389, "dur": 1.610, "args": { "External id": 20502,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318518.931, "dur": 0.390, "args": { "External id": 20503,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318520.670, "dur": 0.471, "args": { "External id": 20504,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318522.310, "dur": 0.321, "args": { "External id": 20505,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318523.653, "dur": 0.807, "args": { "External id": 20506,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318525.551, "dur": 0.814, "args": { "External id": 20507,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318527.449, "dur": 0.552, "args": { "External id": 20508,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318529.246, "dur": 0.262, "args": { "External id": 20509,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318530.627, "dur": 0.222, "args": { "External id": 20510,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651318544.972, "dur": 28.523, "args": { "External id": 20511,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3102 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651318603.781, "dur": 99.485, "args": { "External id": 20512,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651318613.915, "dur": 3.459, "args": { "External id": 20513,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651318622.360, "dur": 10.522, "args": { "External id": 20514,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651318626.750, "dur": 5.597, "args": { "External id": 20515,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318630.323, "dur": 0.574, "args": { "External id": 20516,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651318639.845, "dur": 19.804, "args": { "External id": 20517,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318641.931, "dur": 0.806, "args": { "External id": 20518,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318643.992, "dur": 0.520, "args": { "External id": 20519,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318645.766, "dur": 0.446, "args": { "External id": 20520,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318647.549, "dur": 0.282, "args": { "External id": 20521,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318649.003, "dur": 0.589, "args": { "External id": 20522,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318650.821, "dur": 0.415, "args": { "External id": 20523,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318652.543, "dur": 0.353, "args": { "External id": 20524,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318653.949, "dur": 0.384, "args": { "External id": 20525,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651318655.408, "dur": 0.483, "args": { "External id": 20526,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651318676.229, "dur": 19.023, "args": { "External id": 20527,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3118 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651318745.553, "dur": 112.298, "args": { "External id": 20528,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3119 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651318773.600, "dur": 81.140, "args": { "External id": 20529,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3120, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651318783.067, "dur": 67.800, "args": { "External id": 20530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3121 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651318874.291, "dur": 2.009, "args": { "External id": 20531,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3122, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651318948.238, "dur": 1630.568, "args": { "External id": 20532,"Sequence number": 246576, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3123 } }, { "ph": "f", "id": 192, "pid": 1336757, "tid": 1381170, "ts": 1295651318948.238, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651319102.960, "dur": 104.787, "args": { "External id": 20533,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3124 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651319264.153, "dur": 40.248, "args": { "External id": 20534,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651319322.797, "dur": 52.354, "args": { "External id": 20535,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651319385.317, "dur": 32.343, "args": { "External id": 20536,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651319424.016, "dur": 45.135, "args": { "External id": 20537,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651319476.065, "dur": 27.088, "args": { "External id": 20538,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651319510.539, "dur": 40.945, "args": { "External id": 20539,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3130 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651319574.830, "dur": 22.895, "args": { "External id": 20540,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3131 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651319616.896, "dur": 27.251, "args": { "External id": 20541,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3132 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651319662.580, "dur": 20.012, "args": { "External id": 20542,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3133 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651319697.068, "dur": 16.114, "args": { "External id": 20543,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651319722.471, "dur": 29.186, "args": { "External id": 20544,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651319754.480, "dur": 32.240, "args": { "External id": 20545,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3136 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651319812.300, "dur": 158.818, "args": { "External id": 20546,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651319883.823, "dur": 5.852, "args": { "External id": 20547,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651319891.476, "dur": 2.293, "args": { "External id": 20548,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3139 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651320039.435, "dur": 28.271, "args": { "External id": 20549,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3140 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651320085.764, "dur": 14.854, "args": { "External id": 20550,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651320110.039, "dur": 41.221, "args": { "External id": 20551,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651320156.861, "dur": 33.919, "args": { "External id": 20552,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651320196.466, "dur": 21.816, "args": { "External id": 20553,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651320222.229, "dur": 44.965, "args": { "External id": 20554,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651320275.476, "dur": 23.550, "args": { "External id": 20555,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651320305.422, "dur": 29.121, "args": { "External id": 20556,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3147 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651320356.435, "dur": 35.571, "args": { "External id": 20557,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3148 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651320416.672, "dur": 27.410, "args": { "External id": 20558,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3149 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651320459.709, "dur": 17.861, "args": { "External id": 20559,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3150 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651320493.338, "dur": 18.522, "args": { "External id": 20560,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3151 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651320524.575, "dur": 23.321, "args": { "External id": 20561,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3152 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320620.711, "dur": 15.121, "args": { "External id": 20562,"Record function id": 0, "Ev Idx": 3153 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320623.804, "dur": 11.095, "args": { "External id": 20563,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320627.891, "dur": 6.194, "args": { "External id": 20564,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3155 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320629.475, "dur": 4.478, "args": { "External id": 20565,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3156 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320639.770, "dur": 4.611, "args": { "External id": 20566,"Record function id": 0, "Ev Idx": 3157 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320641.171, "dur": 2.717, "args": { "External id": 20567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320641.844, "dur": 1.461, "args": { "External id": 20568,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3159 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320642.368, "dur": 0.871, "args": { "External id": 20569,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3160 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320647.684, "dur": 4.153, "args": { "External id": 20570,"Record function id": 0, "Ev Idx": 3161 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320648.897, "dur": 2.476, "args": { "External id": 20571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320649.520, "dur": 1.413, "args": { "External id": 20572,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3163 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320650.087, "dur": 0.762, "args": { "External id": 20573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3164 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320655.018, "dur": 4.453, "args": { "External id": 20574,"Record function id": 0, "Ev Idx": 3165 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320655.989, "dur": 3.039, "args": { "External id": 20575,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320656.679, "dur": 1.946, "args": { "External id": 20576,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3167 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320657.596, "dur": 0.952, "args": { "External id": 20577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3168 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320662.544, "dur": 4.120, "args": { "External id": 20578,"Record function id": 0, "Ev Idx": 3169 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320663.518, "dur": 2.701, "args": { "External id": 20579,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320664.248, "dur": 1.561, "args": { "External id": 20580,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3171 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320664.859, "dur": 0.876, "args": { "External id": 20581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3172 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320669.718, "dur": 4.179, "args": { "External id": 20582,"Record function id": 0, "Ev Idx": 3173 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320670.750, "dur": 2.692, "args": { "External id": 20583,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320671.201, "dur": 1.854, "args": { "External id": 20584,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3175 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320671.925, "dur": 1.063, "args": { "External id": 20585,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3176 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320677.110, "dur": 4.014, "args": { "External id": 20586,"Record function id": 0, "Ev Idx": 3177 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320678.357, "dur": 2.331, "args": { "External id": 20587,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320679.042, "dur": 1.261, "args": { "External id": 20588,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3179 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320679.541, "dur": 0.687, "args": { "External id": 20589,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3180 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320684.652, "dur": 3.312, "args": { "External id": 20590,"Record function id": 0, "Ev Idx": 3181 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320685.588, "dur": 1.948, "args": { "External id": 20591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320686.062, "dur": 1.075, "args": { "External id": 20592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3183 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320686.338, "dur": 0.725, "args": { "External id": 20593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3184 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320691.377, "dur": 4.063, "args": { "External id": 20594,"Record function id": 0, "Ev Idx": 3185 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651320692.416, "dur": 2.599, "args": { "External id": 20595,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320692.899, "dur": 1.702, "args": { "External id": 20596,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3187 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651320693.393, "dur": 1.142, "args": { "External id": 20597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3188 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651320699.042, "dur": 36168.824, "args": { "External id": 20598,"Record function id": 0, "Sequence number": 246575, "Fwd thread id": 1, "Ev Idx": 3189 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651320700.093, "dur": 36159.376, "args": { "External id": 20599,"Sequence number": 246575, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3190 } }, { "ph": "f", "id": 193, "pid": 1336757, "tid": 1381170, "ts": 1295651320700.093, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.17)", "pid": 1336757, "tid": 1381170, "ts": 1295651320729.130, "dur": 37.908, "args": { "External id": 20600,"Record function id": 0, "Ev Idx": 3191 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.17)", "pid": 1336757, "tid": 1381170, "ts": 1295651320774.678, "dur": 59.217, "args": { "External id": 20601,"Record function id": 0, "Ev Idx": 3192 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.17)", "pid": 1336757, "tid": 1381170, "ts": 1295651320840.088, "dur": 36011.253, "args": { "External id": 20602,"Record function id": 0, "Ev Idx": 3193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651320927.871, "dur": 6.882, "args": { "External id": 20603,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651320943.659, "dur": 4.796, "args": { "External id": 20604,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3195 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651320962.760, "dur": 35046.533, "args": { "External id": 20605,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651320975.748, "dur": 35000.771, "args": { "External id": 20606,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651321060.775, "dur": 14.139, "args": { "External id": 20607,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651321081.089, "dur": 34857.201, "args": { "External id": 20608,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651321083.881, "dur": 34853.756, "args": { "External id": 20609,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651321087.799, "dur": 6.020, "args": { "External id": 20610,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651321095.486, "dur": 34839.205, "args": { "External id": 20611,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651356099.207, "dur": 9.201, "args": { "External id": 20612,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651356102.044, "dur": 6.040, "args": { "External id": 20613,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3204 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651356134.138, "dur": 431.695, "args": { "External id": 20614,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3205 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651356165.731, "dur": 394.997, "args": { "External id": 20615,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3206, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651356176.989, "dur": 378.169, "args": { "External id": 20616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3207 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651356590.335, "dur": 2.499, "args": { "External id": 20617,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3208, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356654.783, "dur": 6.676, "args": { "External id": 20618,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356705.110, "dur": 1.622, "args": { "External id": 20619,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356721.967, "dur": 1.254, "args": { "External id": 20620,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356734.728, "dur": 1.212, "args": { "External id": 20621,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356745.580, "dur": 1.050, "args": { "External id": 20622,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356755.833, "dur": 1.162, "args": { "External id": 20623,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356768.895, "dur": 1.094, "args": { "External id": 20624,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356780.400, "dur": 1.414, "args": { "External id": 20625,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651356790.877, "dur": 1.158, "args": { "External id": 20626,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3217 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651356882.677, "dur": 2726.849, "args": { "External id": 20627,"Record function id": 0, "Ev Idx": 3218 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.16)", "pid": 1336757, "tid": 1381170, "ts": 1295651356901.709, "dur": 1039.113, "args": { "External id": 20628,"Record function id": 0, "Ev Idx": 3219 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 1336757, "tid": 1381170, "ts": 1295651356915.721, "dur": 404.732, "args": { "External id": 20629,"Record function id": 0, "Ev Idx": 3220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357042.529, "dur": 5.163, "args": { "External id": 20630,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357051.541, "dur": 1.054, "args": { "External id": 20631,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357056.698, "dur": 0.978, "args": { "External id": 20632,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357059.319, "dur": 1.975, "args": { "External id": 20633,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357062.728, "dur": 1.450, "args": { "External id": 20634,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357065.463, "dur": 1.648, "args": { "External id": 20635,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357070.544, "dur": 1.613, "args": { "External id": 20636,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357073.777, "dur": 1.132, "args": { "External id": 20637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357076.373, "dur": 1.525, "args": { "External id": 20638,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651357079.391, "dur": 1.420, "args": { "External id": 20639,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3230 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651357101.638, "dur": 177.727, "args": { "External id": 20640,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651357117.473, "dur": 144.012, "args": { "External id": 20641,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651357135.648, "dur": 13.201, "args": { "External id": 20642,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651357151.874, "dur": 65.574, "args": { "External id": 20643,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651357154.330, "dur": 62.815, "args": { "External id": 20644,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357158.250, "dur": 6.147, "args": { "External id": 20645,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651357166.079, "dur": 50.392, "args": { "External id": 20646,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3237 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.15", "pid": 1336757, "tid": 1381170, "ts": 1295651357408.285, "dur": 524.537, "args": { "External id": 20647,"Record function id": 0, "Ev Idx": 3238 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 1336757, "tid": 1381170, "ts": 1295651357425.153, "dur": 495.763, "args": { "External id": 20648,"Record function id": 0, "Ev Idx": 3239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651357481.675, "dur": 6.413, "args": { "External id": 20649,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651357503.897, "dur": 28.680, "args": { "External id": 20650,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357508.788, "dur": 2.187, "args": { "External id": 20651,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357512.879, "dur": 0.763, "args": { "External id": 20652,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357515.072, "dur": 0.853, "args": { "External id": 20653,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357517.366, "dur": 1.208, "args": { "External id": 20654,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357519.792, "dur": 0.906, "args": { "External id": 20655,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357521.987, "dur": 0.678, "args": { "External id": 20656,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357523.886, "dur": 0.729, "args": { "External id": 20657,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357526.199, "dur": 0.569, "args": { "External id": 20658,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357527.754, "dur": 0.321, "args": { "External id": 20659,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651357542.172, "dur": 31.860, "args": { "External id": 20660,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3251 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651357606.043, "dur": 97.926, "args": { "External id": 20661,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651357616.381, "dur": 3.394, "args": { "External id": 20662,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651357624.624, "dur": 10.070, "args": { "External id": 20663,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651357628.827, "dur": 5.458, "args": { "External id": 20664,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357632.018, "dur": 0.854, "args": { "External id": 20665,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651357641.217, "dur": 23.620, "args": { "External id": 20666,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357643.259, "dur": 0.769, "args": { "External id": 20667,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357645.208, "dur": 0.810, "args": { "External id": 20668,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357646.936, "dur": 0.654, "args": { "External id": 20669,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357648.725, "dur": 0.589, "args": { "External id": 20670,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357650.450, "dur": 0.410, "args": { "External id": 20671,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357651.842, "dur": 0.905, "args": { "External id": 20672,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357653.615, "dur": 1.067, "args": { "External id": 20673,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357655.351, "dur": 0.753, "args": { "External id": 20674,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651357656.920, "dur": 0.559, "args": { "External id": 20675,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651357678.395, "dur": 17.970, "args": { "External id": 20676,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3267 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651357745.904, "dur": 112.465, "args": { "External id": 20677,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3268 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651357773.504, "dur": 81.672, "args": { "External id": 20678,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3269, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651357782.706, "dur": 68.079, "args": { "External id": 20679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3270 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651357874.950, "dur": 1.995, "args": { "External id": 20680,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3271, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651357947.831, "dur": 1640.796, "args": { "External id": 20681,"Sequence number": 246574, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3272 } }, { "ph": "f", "id": 194, "pid": 1336757, "tid": 1381170, "ts": 1295651357947.831, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651358092.333, "dur": 103.861, "args": { "External id": 20682,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3273 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651358250.640, "dur": 40.667, "args": { "External id": 20683,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651358309.319, "dur": 53.791, "args": { "External id": 20684,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651358372.383, "dur": 32.639, "args": { "External id": 20685,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651358411.367, "dur": 45.870, "args": { "External id": 20686,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651358472.855, "dur": 27.888, "args": { "External id": 20687,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651358507.797, "dur": 42.397, "args": { "External id": 20688,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3279 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651358576.980, "dur": 22.460, "args": { "External id": 20689,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3280 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651358618.385, "dur": 26.386, "args": { "External id": 20690,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3281 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651358666.719, "dur": 19.780, "args": { "External id": 20691,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3282 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651358700.444, "dur": 16.316, "args": { "External id": 20692,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651358726.061, "dur": 29.932, "args": { "External id": 20693,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651358758.832, "dur": 33.440, "args": { "External id": 20694,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3285 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651358817.586, "dur": 205.051, "args": { "External id": 20695,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651358895.184, "dur": 6.178, "args": { "External id": 20696,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651358903.277, "dur": 2.799, "args": { "External id": 20697,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3288 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651359058.079, "dur": 29.073, "args": { "External id": 20698,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3289 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651359098.241, "dur": 15.335, "args": { "External id": 20699,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651359123.608, "dur": 41.319, "args": { "External id": 20700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651359171.295, "dur": 34.562, "args": { "External id": 20701,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651359212.271, "dur": 37.175, "args": { "External id": 20702,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651359257.263, "dur": 33.547, "args": { "External id": 20703,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651359296.950, "dur": 22.018, "args": { "External id": 20704,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651359325.366, "dur": 29.476, "args": { "External id": 20705,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3296 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651359384.772, "dur": 30.672, "args": { "External id": 20706,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3297 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651359437.491, "dur": 23.962, "args": { "External id": 20707,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3298 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651359476.801, "dur": 21.118, "args": { "External id": 20708,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3299 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651359513.829, "dur": 15.184, "args": { "External id": 20709,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3300 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651359542.165, "dur": 18.640, "args": { "External id": 20710,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3301 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359631.517, "dur": 14.904, "args": { "External id": 20711,"Record function id": 0, "Ev Idx": 3302 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359634.956, "dur": 10.492, "args": { "External id": 20712,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359638.728, "dur": 5.801, "args": { "External id": 20713,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3304 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359640.070, "dur": 4.367, "args": { "External id": 20714,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3305 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359650.392, "dur": 5.081, "args": { "External id": 20715,"Record function id": 0, "Ev Idx": 3306 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359651.894, "dur": 3.100, "args": { "External id": 20716,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359652.759, "dur": 1.789, "args": { "External id": 20717,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3308 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359653.441, "dur": 1.009, "args": { "External id": 20718,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3309 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359658.873, "dur": 4.516, "args": { "External id": 20719,"Record function id": 0, "Ev Idx": 3310 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359660.605, "dur": 2.319, "args": { "External id": 20720,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359661.138, "dur": 1.381, "args": { "External id": 20721,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3312 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359661.590, "dur": 0.823, "args": { "External id": 20722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3313 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359666.746, "dur": 4.593, "args": { "External id": 20723,"Record function id": 0, "Ev Idx": 3314 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359668.121, "dur": 2.809, "args": { "External id": 20724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359668.696, "dur": 1.842, "args": { "External id": 20725,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3316 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359669.174, "dur": 1.245, "args": { "External id": 20726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3317 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359674.440, "dur": 3.898, "args": { "External id": 20727,"Record function id": 0, "Ev Idx": 3318 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359675.607, "dur": 2.305, "args": { "External id": 20728,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359676.225, "dur": 1.263, "args": { "External id": 20729,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3320 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359676.610, "dur": 0.816, "args": { "External id": 20730,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3321 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359681.390, "dur": 5.719, "args": { "External id": 20731,"Record function id": 0, "Ev Idx": 3322 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359682.466, "dur": 4.235, "args": { "External id": 20732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359683.054, "dur": 3.232, "args": { "External id": 20733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3324 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359683.693, "dur": 2.520, "args": { "External id": 20734,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3325 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359690.372, "dur": 3.833, "args": { "External id": 20735,"Record function id": 0, "Ev Idx": 3326 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359691.529, "dur": 2.281, "args": { "External id": 20736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359691.996, "dur": 1.383, "args": { "External id": 20737,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3328 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359692.279, "dur": 1.034, "args": { "External id": 20738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3329 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359697.293, "dur": 3.864, "args": { "External id": 20739,"Record function id": 0, "Ev Idx": 3330 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359698.681, "dur": 2.044, "args": { "External id": 20740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359699.178, "dur": 1.147, "args": { "External id": 20741,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3332 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359699.472, "dur": 0.779, "args": { "External id": 20742,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359704.202, "dur": 3.405, "args": { "External id": 20743,"Record function id": 0, "Ev Idx": 3334 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651359705.239, "dur": 1.950, "args": { "External id": 20744,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359705.700, "dur": 1.097, "args": { "External id": 20745,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3336 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651359706.046, "dur": 0.684, "args": { "External id": 20746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651359711.567, "dur": 36586.763, "args": { "External id": 20747,"Record function id": 0, "Sequence number": 246573, "Fwd thread id": 1, "Ev Idx": 3338 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651359712.730, "dur": 36576.031, "args": { "External id": 20748,"Sequence number": 246573, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3339 } }, { "ph": "f", "id": 195, "pid": 1336757, "tid": 1381170, "ts": 1295651359712.730, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.16)", "pid": 1336757, "tid": 1381170, "ts": 1295651359741.657, "dur": 35.570, "args": { "External id": 20749,"Record function id": 0, "Ev Idx": 3340 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.16)", "pid": 1336757, "tid": 1381170, "ts": 1295651359784.473, "dur": 59.863, "args": { "External id": 20750,"Record function id": 0, "Ev Idx": 3341 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.16)", "pid": 1336757, "tid": 1381170, "ts": 1295651359849.993, "dur": 36430.638, "args": { "External id": 20751,"Record function id": 0, "Ev Idx": 3342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651359934.254, "dur": 6.271, "args": { "External id": 20752,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651359949.412, "dur": 4.712, "args": { "External id": 20753,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3344 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651359968.161, "dur": 35363.322, "args": { "External id": 20754,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651359980.574, "dur": 35341.079, "args": { "External id": 20755,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651360068.900, "dur": 14.248, "args": { "External id": 20756,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651360089.218, "dur": 35190.021, "args": { "External id": 20757,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651360091.835, "dur": 35186.697, "args": { "External id": 20758,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651360095.762, "dur": 5.860, "args": { "External id": 20759,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651360103.107, "dur": 35171.861, "args": { "External id": 20760,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651395424.656, "dur": 10.222, "args": { "External id": 20761,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651395427.595, "dur": 6.940, "args": { "External id": 20762,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3353 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651395462.484, "dur": 458.761, "args": { "External id": 20763,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3354 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651395495.004, "dur": 420.411, "args": { "External id": 20764,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3355, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651395505.819, "dur": 403.719, "args": { "External id": 20765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3356 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651395951.540, "dur": 2.580, "args": { "External id": 20766,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3357, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396060.404, "dur": 7.029, "args": { "External id": 20767,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396113.422, "dur": 1.945, "args": { "External id": 20768,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396130.627, "dur": 1.452, "args": { "External id": 20769,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396144.706, "dur": 1.086, "args": { "External id": 20770,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396156.510, "dur": 1.196, "args": { "External id": 20771,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396167.103, "dur": 1.052, "args": { "External id": 20772,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396177.848, "dur": 0.948, "args": { "External id": 20773,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396188.860, "dur": 1.723, "args": { "External id": 20774,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396202.249, "dur": 1.618, "args": { "External id": 20775,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3366 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651396314.517, "dur": 2605.028, "args": { "External id": 20776,"Record function id": 0, "Ev Idx": 3367 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.15)", "pid": 1336757, "tid": 1381170, "ts": 1295651396333.348, "dur": 984.342, "args": { "External id": 20777,"Record function id": 0, "Ev Idx": 3368 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 1336757, "tid": 1381170, "ts": 1295651396347.310, "dur": 303.930, "args": { "External id": 20778,"Record function id": 0, "Ev Idx": 3369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396425.712, "dur": 5.107, "args": { "External id": 20779,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396433.923, "dur": 1.166, "args": { "External id": 20780,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396436.555, "dur": 1.277, "args": { "External id": 20781,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396439.462, "dur": 1.370, "args": { "External id": 20782,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396444.203, "dur": 1.014, "args": { "External id": 20783,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396446.413, "dur": 1.177, "args": { "External id": 20784,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396449.055, "dur": 1.403, "args": { "External id": 20785,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396451.697, "dur": 1.534, "args": { "External id": 20786,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396456.612, "dur": 1.936, "args": { "External id": 20787,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651396460.239, "dur": 0.984, "args": { "External id": 20788,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3379 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651396478.938, "dur": 145.495, "args": { "External id": 20789,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651396494.799, "dur": 125.520, "args": { "External id": 20790,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651396510.995, "dur": 11.804, "args": { "External id": 20791,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651396525.750, "dur": 66.017, "args": { "External id": 20792,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651396528.287, "dur": 63.127, "args": { "External id": 20793,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396531.811, "dur": 5.492, "args": { "External id": 20794,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651396541.200, "dur": 49.560, "args": { "External id": 20795,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3386 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.14", "pid": 1336757, "tid": 1381170, "ts": 1295651396726.135, "dur": 584.264, "args": { "External id": 20796,"Record function id": 0, "Ev Idx": 3387 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 1336757, "tid": 1381170, "ts": 1295651396741.321, "dur": 557.431, "args": { "External id": 20797,"Record function id": 0, "Ev Idx": 3388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651396794.894, "dur": 4.833, "args": { "External id": 20798,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651396815.247, "dur": 23.079, "args": { "External id": 20799,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396819.417, "dur": 1.910, "args": { "External id": 20800,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396823.047, "dur": 0.497, "args": { "External id": 20801,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396824.540, "dur": 0.419, "args": { "External id": 20802,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396825.938, "dur": 0.384, "args": { "External id": 20803,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396827.224, "dur": 0.886, "args": { "External id": 20804,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396829.306, "dur": 0.883, "args": { "External id": 20805,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396831.073, "dur": 0.993, "args": { "External id": 20806,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396833.238, "dur": 0.507, "args": { "External id": 20807,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396834.849, "dur": 0.542, "args": { "External id": 20808,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651396848.141, "dur": 27.923, "args": { "External id": 20809,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3400 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651396903.056, "dur": 146.003, "args": { "External id": 20810,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651396912.370, "dur": 3.028, "args": { "External id": 20811,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651396920.123, "dur": 9.271, "args": { "External id": 20812,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651396924.001, "dur": 4.989, "args": { "External id": 20813,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396927.169, "dur": 0.571, "args": { "External id": 20814,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651396936.051, "dur": 24.704, "args": { "External id": 20815,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396937.541, "dur": 0.522, "args": { "External id": 20816,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396939.225, "dur": 0.444, "args": { "External id": 20817,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396940.624, "dur": 0.784, "args": { "External id": 20818,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396942.755, "dur": 0.884, "args": { "External id": 20819,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396944.591, "dur": 0.485, "args": { "External id": 20820,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396946.080, "dur": 0.540, "args": { "External id": 20821,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396947.837, "dur": 1.157, "args": { "External id": 20822,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396950.113, "dur": 0.910, "args": { "External id": 20823,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651396952.190, "dur": 0.591, "args": { "External id": 20824,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651396969.572, "dur": 69.552, "args": { "External id": 20825,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3416 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651397097.294, "dur": 113.927, "args": { "External id": 20826,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3417 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651397126.530, "dur": 81.194, "args": { "External id": 20827,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3418, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651397135.692, "dur": 67.610, "args": { "External id": 20828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3419 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651397241.697, "dur": 3.040, "args": { "External id": 20829,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3420, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651397325.528, "dur": 1573.650, "args": { "External id": 20830,"Sequence number": 246572, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3421 } }, { "ph": "f", "id": 196, "pid": 1336757, "tid": 1381170, "ts": 1295651397325.528, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651397431.138, "dur": 101.654, "args": { "External id": 20831,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3422 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651397569.832, "dur": 38.966, "args": { "External id": 20832,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651397623.388, "dur": 47.644, "args": { "External id": 20833,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651397679.950, "dur": 32.035, "args": { "External id": 20834,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651397717.725, "dur": 44.720, "args": { "External id": 20835,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651397769.751, "dur": 27.657, "args": { "External id": 20836,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651397804.886, "dur": 41.223, "args": { "External id": 20837,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3428 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651397869.670, "dur": 22.217, "args": { "External id": 20838,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3429 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651397913.011, "dur": 27.575, "args": { "External id": 20839,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3430 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651397959.820, "dur": 19.205, "args": { "External id": 20840,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3431 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651398047.213, "dur": 19.748, "args": { "External id": 20841,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398077.351, "dur": 35.116, "args": { "External id": 20842,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398115.894, "dur": 32.490, "args": { "External id": 20843,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3434 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651398181.845, "dur": 189.728, "args": { "External id": 20844,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651398278.930, "dur": 6.475, "args": { "External id": 20845,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651398287.471, "dur": 2.836, "args": { "External id": 20846,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3437 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651398403.264, "dur": 27.515, "args": { "External id": 20847,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3438 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651398441.693, "dur": 14.987, "args": { "External id": 20848,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398464.805, "dur": 40.559, "args": { "External id": 20849,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398512.468, "dur": 33.618, "args": { "External id": 20850,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398552.248, "dur": 22.119, "args": { "External id": 20851,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398578.147, "dur": 28.838, "args": { "External id": 20852,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398613.381, "dur": 20.970, "args": { "External id": 20853,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651398640.769, "dur": 29.011, "args": { "External id": 20854,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3445 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651398688.452, "dur": 31.968, "args": { "External id": 20855,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3446 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651398744.825, "dur": 29.718, "args": { "External id": 20856,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3447 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651398790.075, "dur": 18.491, "args": { "External id": 20857,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3448 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651398823.297, "dur": 15.962, "args": { "External id": 20858,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3449 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651398852.641, "dur": 16.795, "args": { "External id": 20859,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3450 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398940.784, "dur": 18.861, "args": { "External id": 20860,"Record function id": 0, "Ev Idx": 3451 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398944.753, "dur": 13.968, "args": { "External id": 20861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398948.838, "dur": 8.723, "args": { "External id": 20862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3453 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398950.129, "dur": 7.340, "args": { "External id": 20863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3454 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398963.441, "dur": 4.732, "args": { "External id": 20864,"Record function id": 0, "Ev Idx": 3455 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398964.767, "dur": 2.865, "args": { "External id": 20865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398965.586, "dur": 1.565, "args": { "External id": 20866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3457 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398966.056, "dur": 1.026, "args": { "External id": 20867,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3458 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398971.448, "dur": 3.965, "args": { "External id": 20868,"Record function id": 0, "Ev Idx": 3459 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398972.599, "dur": 2.362, "args": { "External id": 20869,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398973.134, "dur": 1.383, "args": { "External id": 20870,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3461 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398973.717, "dur": 0.706, "args": { "External id": 20871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3462 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398978.626, "dur": 4.607, "args": { "External id": 20872,"Record function id": 0, "Ev Idx": 3463 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651398979.773, "dur": 3.046, "args": { "External id": 20873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398980.652, "dur": 1.755, "args": { "External id": 20874,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3465 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651398981.280, "dur": 1.040, "args": { "External id": 20875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3466 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399024.229, "dur": 6.813, "args": { "External id": 20876,"Record function id": 0, "Ev Idx": 3467 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399025.970, "dur": 4.400, "args": { "External id": 20877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399027.252, "dur": 2.252, "args": { "External id": 20878,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3469 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399027.879, "dur": 1.434, "args": { "External id": 20879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3470 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399034.347, "dur": 4.278, "args": { "External id": 20880,"Record function id": 0, "Ev Idx": 3471 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399035.793, "dur": 2.415, "args": { "External id": 20881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399036.374, "dur": 1.420, "args": { "External id": 20882,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3473 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399036.893, "dur": 0.813, "args": { "External id": 20883,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3474 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399042.155, "dur": 4.354, "args": { "External id": 20884,"Record function id": 0, "Ev Idx": 3475 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399043.472, "dur": 2.642, "args": { "External id": 20885,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399044.073, "dur": 1.628, "args": { "External id": 20886,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3477 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399044.641, "dur": 0.980, "args": { "External id": 20887,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3478 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399049.710, "dur": 3.903, "args": { "External id": 20888,"Record function id": 0, "Ev Idx": 3479 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399050.938, "dur": 2.255, "args": { "External id": 20889,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399051.433, "dur": 1.356, "args": { "External id": 20890,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3481 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399051.824, "dur": 0.899, "args": { "External id": 20891,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3482 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399056.762, "dur": 3.358, "args": { "External id": 20892,"Record function id": 0, "Ev Idx": 3483 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651399057.731, "dur": 1.973, "args": { "External id": 20893,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399058.193, "dur": 1.087, "args": { "External id": 20894,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3485 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651399058.534, "dur": 0.680, "args": { "External id": 20895,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651399063.969, "dur": 36537.490, "args": { "External id": 20896,"Record function id": 0, "Sequence number": 246571, "Fwd thread id": 1, "Ev Idx": 3487 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651399065.157, "dur": 36528.338, "args": { "External id": 20897,"Sequence number": 246571, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3488 } }, { "ph": "f", "id": 197, "pid": 1336757, "tid": 1381170, "ts": 1295651399065.157, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.15)", "pid": 1336757, "tid": 1381170, "ts": 1295651399093.603, "dur": 34.438, "args": { "External id": 20898,"Record function id": 0, "Ev Idx": 3489 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.15)", "pid": 1336757, "tid": 1381170, "ts": 1295651399135.400, "dur": 59.928, "args": { "External id": 20899,"Record function id": 0, "Ev Idx": 3490 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.15)", "pid": 1336757, "tid": 1381170, "ts": 1295651399201.364, "dur": 36384.909, "args": { "External id": 20900,"Record function id": 0, "Ev Idx": 3491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651399306.205, "dur": 7.513, "args": { "External id": 20901,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651399323.409, "dur": 4.980, "args": { "External id": 20902,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3493 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651399343.259, "dur": 35453.486, "args": { "External id": 20903,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651399356.504, "dur": 35431.996, "args": { "External id": 20904,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651399404.197, "dur": 13.954, "args": { "External id": 20905,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651399423.835, "dur": 35326.994, "args": { "External id": 20906,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651399426.530, "dur": 35323.732, "args": { "External id": 20907,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651399430.538, "dur": 5.474, "args": { "External id": 20908,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651399437.845, "dur": 35308.797, "args": { "External id": 20909,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651434882.035, "dur": 8.985, "args": { "External id": 20910,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651434884.819, "dur": 5.885, "args": { "External id": 20911,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3502 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651434917.083, "dur": 387.216, "args": { "External id": 20912,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3503 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651434947.305, "dur": 351.996, "args": { "External id": 20913,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3504, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651434959.094, "dur": 334.172, "args": { "External id": 20914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3505 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651435329.365, "dur": 2.755, "args": { "External id": 20915,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3506, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435388.392, "dur": 6.713, "args": { "External id": 20916,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435438.876, "dur": 1.686, "args": { "External id": 20917,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435455.534, "dur": 1.482, "args": { "External id": 20918,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435467.778, "dur": 1.273, "args": { "External id": 20919,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435479.217, "dur": 1.074, "args": { "External id": 20920,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435489.713, "dur": 0.902, "args": { "External id": 20921,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435501.318, "dur": 1.069, "args": { "External id": 20922,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435513.147, "dur": 1.884, "args": { "External id": 20923,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435526.390, "dur": 1.386, "args": { "External id": 20924,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3515 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651435614.387, "dur": 2693.942, "args": { "External id": 20925,"Record function id": 0, "Ev Idx": 3516 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.14)", "pid": 1336757, "tid": 1381170, "ts": 1295651435632.326, "dur": 995.411, "args": { "External id": 20926,"Record function id": 0, "Ev Idx": 3517 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 1336757, "tid": 1381170, "ts": 1295651435645.879, "dur": 292.882, "args": { "External id": 20927,"Record function id": 0, "Ev Idx": 3518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435720.082, "dur": 4.518, "args": { "External id": 20928,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435727.380, "dur": 1.403, "args": { "External id": 20929,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435730.711, "dur": 1.084, "args": { "External id": 20930,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435733.234, "dur": 1.503, "args": { "External id": 20931,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435738.242, "dur": 1.209, "args": { "External id": 20932,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435740.851, "dur": 1.256, "args": { "External id": 20933,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435743.625, "dur": 1.068, "args": { "External id": 20934,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435745.994, "dur": 1.149, "args": { "External id": 20935,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435750.391, "dur": 1.856, "args": { "External id": 20936,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651435753.733, "dur": 1.400, "args": { "External id": 20937,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3528 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651435772.439, "dur": 141.451, "args": { "External id": 20938,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651435787.608, "dur": 122.173, "args": { "External id": 20939,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651435804.358, "dur": 11.598, "args": { "External id": 20940,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651435818.580, "dur": 63.712, "args": { "External id": 20941,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651435823.597, "dur": 58.378, "args": { "External id": 20942,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651435827.259, "dur": 5.687, "args": { "External id": 20943,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651435834.590, "dur": 46.854, "args": { "External id": 20944,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3535 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.13", "pid": 1336757, "tid": 1381170, "ts": 1295651436069.499, "dur": 550.694, "args": { "External id": 20945,"Record function id": 0, "Ev Idx": 3536 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 1336757, "tid": 1381170, "ts": 1295651436087.047, "dur": 520.826, "args": { "External id": 20946,"Record function id": 0, "Ev Idx": 3537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651436144.281, "dur": 5.809, "args": { "External id": 20947,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651436166.232, "dur": 25.656, "args": { "External id": 20948,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436170.675, "dur": 2.430, "args": { "External id": 20949,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436174.658, "dur": 0.389, "args": { "External id": 20950,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436176.162, "dur": 0.401, "args": { "External id": 20951,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436178.451, "dur": 0.847, "args": { "External id": 20952,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436180.169, "dur": 0.543, "args": { "External id": 20953,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436181.434, "dur": 0.608, "args": { "External id": 20954,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436183.245, "dur": 1.030, "args": { "External id": 20955,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436185.416, "dur": 0.772, "args": { "External id": 20956,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436187.374, "dur": 0.592, "args": { "External id": 20957,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651436201.357, "dur": 45.504, "args": { "External id": 20958,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3549 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651436280.696, "dur": 107.347, "args": { "External id": 20959,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651436291.237, "dur": 4.504, "args": { "External id": 20960,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651436304.385, "dur": 10.455, "args": { "External id": 20961,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651436308.415, "dur": 6.036, "args": { "External id": 20962,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436311.854, "dur": 0.766, "args": { "External id": 20963,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651436324.367, "dur": 24.846, "args": { "External id": 20964,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436326.203, "dur": 0.449, "args": { "External id": 20965,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436327.974, "dur": 0.793, "args": { "External id": 20966,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436330.008, "dur": 0.561, "args": { "External id": 20967,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436331.655, "dur": 1.053, "args": { "External id": 20968,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436333.992, "dur": 0.860, "args": { "External id": 20969,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436335.820, "dur": 0.942, "args": { "External id": 20970,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436338.013, "dur": 0.801, "args": { "External id": 20971,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436339.974, "dur": 0.598, "args": { "External id": 20972,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651436341.860, "dur": 0.760, "args": { "External id": 20973,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651436360.485, "dur": 20.299, "args": { "External id": 20974,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3565 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651436431.253, "dur": 109.394, "args": { "External id": 20975,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3566 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651436457.942, "dur": 79.531, "args": { "External id": 20976,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3567, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651436468.477, "dur": 64.991, "args": { "External id": 20977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3568 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651436556.881, "dur": 1.705, "args": { "External id": 20978,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3569, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651436634.129, "dur": 1653.334, "args": { "External id": 20979,"Sequence number": 246570, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3570 } }, { "ph": "f", "id": 198, "pid": 1336757, "tid": 1381170, "ts": 1295651436634.129, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651436739.511, "dur": 99.751, "args": { "External id": 20980,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3571 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651436876.305, "dur": 37.656, "args": { "External id": 20981,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651436929.118, "dur": 46.066, "args": { "External id": 20982,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437041.000, "dur": 40.107, "args": { "External id": 20983,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437088.806, "dur": 45.269, "args": { "External id": 20984,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437141.016, "dur": 26.458, "args": { "External id": 20985,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437174.586, "dur": 41.830, "args": { "External id": 20986,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3577 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651437257.868, "dur": 25.083, "args": { "External id": 20987,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3578 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651437301.655, "dur": 26.729, "args": { "External id": 20988,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3579 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651437351.089, "dur": 19.833, "args": { "External id": 20989,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3580 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651437382.976, "dur": 15.953, "args": { "External id": 20990,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437408.267, "dur": 33.483, "args": { "External id": 20991,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437444.971, "dur": 32.821, "args": { "External id": 20992,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3583 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651437528.302, "dur": 167.181, "args": { "External id": 20993,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651437606.666, "dur": 5.293, "args": { "External id": 20994,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651437613.751, "dur": 1.677, "args": { "External id": 20995,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3586 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651437726.442, "dur": 25.103, "args": { "External id": 20996,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3587 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651437761.860, "dur": 14.515, "args": { "External id": 20997,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437785.840, "dur": 35.020, "args": { "External id": 20998,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437827.131, "dur": 33.525, "args": { "External id": 20999,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437866.265, "dur": 21.932, "args": { "External id": 21000,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437892.205, "dur": 29.179, "args": { "External id": 21001,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437927.456, "dur": 20.971, "args": { "External id": 21002,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651437954.610, "dur": 62.870, "args": { "External id": 21003,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3594 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651438042.534, "dur": 25.788, "args": { "External id": 21004,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3595 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651438093.881, "dur": 40.091, "args": { "External id": 21005,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3596 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651438156.246, "dur": 18.941, "args": { "External id": 21006,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3597 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651438191.098, "dur": 14.661, "args": { "External id": 21007,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3598 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651438218.434, "dur": 34.554, "args": { "External id": 21008,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3599 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438331.385, "dur": 14.805, "args": { "External id": 21009,"Record function id": 0, "Ev Idx": 3600 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438334.487, "dur": 10.798, "args": { "External id": 21010,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438338.547, "dur": 5.833, "args": { "External id": 21011,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3602 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438339.683, "dur": 4.604, "args": { "External id": 21012,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3603 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438349.919, "dur": 4.854, "args": { "External id": 21013,"Record function id": 0, "Ev Idx": 3604 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438351.236, "dur": 3.090, "args": { "External id": 21014,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438352.188, "dur": 1.672, "args": { "External id": 21015,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3606 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438352.850, "dur": 0.936, "args": { "External id": 21016,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3607 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438358.154, "dur": 4.285, "args": { "External id": 21017,"Record function id": 0, "Ev Idx": 3608 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438359.356, "dur": 2.599, "args": { "External id": 21018,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438359.933, "dur": 1.590, "args": { "External id": 21019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3610 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438360.466, "dur": 0.943, "args": { "External id": 21020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3611 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438365.690, "dur": 4.296, "args": { "External id": 21021,"Record function id": 0, "Ev Idx": 3612 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438367.127, "dur": 2.397, "args": { "External id": 21022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438367.951, "dur": 1.186, "args": { "External id": 21023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3614 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438368.242, "dur": 0.778, "args": { "External id": 21024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3615 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438373.100, "dur": 4.607, "args": { "External id": 21025,"Record function id": 0, "Ev Idx": 3616 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438374.605, "dur": 2.653, "args": { "External id": 21026,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438375.134, "dur": 1.731, "args": { "External id": 21027,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3618 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438375.616, "dur": 1.174, "args": { "External id": 21028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3619 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438380.832, "dur": 3.968, "args": { "External id": 21029,"Record function id": 0, "Ev Idx": 3620 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438382.025, "dur": 2.342, "args": { "External id": 21030,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438382.712, "dur": 1.243, "args": { "External id": 21031,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3622 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438383.149, "dur": 0.705, "args": { "External id": 21032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3623 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438387.967, "dur": 3.799, "args": { "External id": 21033,"Record function id": 0, "Ev Idx": 3624 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438389.260, "dur": 2.091, "args": { "External id": 21034,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438389.823, "dur": 1.148, "args": { "External id": 21035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3626 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438390.107, "dur": 0.800, "args": { "External id": 21036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3627 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438394.924, "dur": 3.814, "args": { "External id": 21037,"Record function id": 0, "Ev Idx": 3628 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438396.291, "dur": 2.023, "args": { "External id": 21038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438396.854, "dur": 1.031, "args": { "External id": 21039,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3630 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438397.122, "dur": 0.698, "args": { "External id": 21040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3631 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438402.187, "dur": 3.923, "args": { "External id": 21041,"Record function id": 0, "Ev Idx": 3632 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651438403.449, "dur": 2.191, "args": { "External id": 21042,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438403.917, "dur": 1.320, "args": { "External id": 21043,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3634 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651438404.283, "dur": 0.880, "args": { "External id": 21044,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3635 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651438409.583, "dur": 36435.481, "args": { "External id": 21045,"Record function id": 0, "Sequence number": 246569, "Fwd thread id": 1, "Ev Idx": 3636 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651438410.925, "dur": 36425.980, "args": { "External id": 21046,"Sequence number": 246569, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3637 } }, { "ph": "f", "id": 199, "pid": 1336757, "tid": 1381170, "ts": 1295651438410.925, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.14)", "pid": 1336757, "tid": 1381170, "ts": 1295651438438.962, "dur": 33.445, "args": { "External id": 21047,"Record function id": 0, "Ev Idx": 3638 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.14)", "pid": 1336757, "tid": 1381170, "ts": 1295651438479.781, "dur": 59.167, "args": { "External id": 21048,"Record function id": 0, "Ev Idx": 3639 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.14)", "pid": 1336757, "tid": 1381170, "ts": 1295651438544.935, "dur": 36284.499, "args": { "External id": 21049,"Record function id": 0, "Ev Idx": 3640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651438628.973, "dur": 6.999, "args": { "External id": 21050,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651438644.908, "dur": 4.655, "args": { "External id": 21051,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3642 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651438663.699, "dur": 35414.034, "args": { "External id": 21052,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651438676.550, "dur": 35392.611, "args": { "External id": 21053,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651438722.973, "dur": 13.467, "args": { "External id": 21054,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651438742.366, "dur": 35286.433, "args": { "External id": 21055,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651438744.684, "dur": 35283.463, "args": { "External id": 21056,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651438748.308, "dur": 4.736, "args": { "External id": 21057,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651438754.564, "dur": 35270.129, "args": { "External id": 21058,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651474164.044, "dur": 8.684, "args": { "External id": 21059,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651474166.563, "dur": 5.840, "args": { "External id": 21060,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3651 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651474201.823, "dur": 355.739, "args": { "External id": 21061,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3652 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651474244.546, "dur": 308.218, "args": { "External id": 21062,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3653, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651474256.351, "dur": 291.250, "args": { "External id": 21063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3654 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651474577.911, "dur": 2.684, "args": { "External id": 21064,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3655, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474635.606, "dur": 6.589, "args": { "External id": 21065,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474685.596, "dur": 2.002, "args": { "External id": 21066,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474703.125, "dur": 1.429, "args": { "External id": 21067,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474716.675, "dur": 1.325, "args": { "External id": 21068,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474728.028, "dur": 0.970, "args": { "External id": 21069,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474738.813, "dur": 0.654, "args": { "External id": 21070,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474749.130, "dur": 1.005, "args": { "External id": 21071,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474760.075, "dur": 1.980, "args": { "External id": 21072,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651474771.955, "dur": 1.595, "args": { "External id": 21073,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3664 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651474857.938, "dur": 2669.764, "args": { "External id": 21074,"Record function id": 0, "Ev Idx": 3665 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.13)", "pid": 1336757, "tid": 1381170, "ts": 1295651474877.116, "dur": 966.304, "args": { "External id": 21075,"Record function id": 0, "Ev Idx": 3666 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 1336757, "tid": 1381170, "ts": 1295651474891.717, "dur": 364.811, "args": { "External id": 21076,"Record function id": 0, "Ev Idx": 3667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651474964.271, "dur": 4.219, "args": { "External id": 21077,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651474971.666, "dur": 1.790, "args": { "External id": 21078,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651474975.316, "dur": 1.056, "args": { "External id": 21079,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651474977.883, "dur": 1.318, "args": { "External id": 21080,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651475030.107, "dur": 1.699, "args": { "External id": 21081,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651475035.180, "dur": 1.812, "args": { "External id": 21082,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651475038.646, "dur": 1.143, "args": { "External id": 21083,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651475041.083, "dur": 0.807, "args": { "External id": 21084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651475045.326, "dur": 1.144, "args": { "External id": 21085,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651475047.816, "dur": 1.196, "args": { "External id": 21086,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3677 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651475067.493, "dur": 143.144, "args": { "External id": 21087,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651475083.365, "dur": 122.834, "args": { "External id": 21088,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651475100.977, "dur": 11.514, "args": { "External id": 21089,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651475115.169, "dur": 64.302, "args": { "External id": 21090,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651475117.447, "dur": 61.729, "args": { "External id": 21091,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475121.028, "dur": 5.875, "args": { "External id": 21092,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651475128.525, "dur": 50.100, "args": { "External id": 21093,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3684 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.12", "pid": 1336757, "tid": 1381170, "ts": 1295651475339.577, "dur": 495.857, "args": { "External id": 21094,"Record function id": 0, "Ev Idx": 3685 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 1336757, "tid": 1381170, "ts": 1295651475356.798, "dur": 466.783, "args": { "External id": 21095,"Record function id": 0, "Ev Idx": 3686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651475413.345, "dur": 5.512, "args": { "External id": 21096,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651475433.625, "dur": 22.751, "args": { "External id": 21097,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475437.770, "dur": 1.873, "args": { "External id": 21098,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475441.085, "dur": 0.252, "args": { "External id": 21099,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475442.290, "dur": 0.197, "args": { "External id": 21100,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475443.337, "dur": 0.550, "args": { "External id": 21101,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475444.762, "dur": 0.649, "args": { "External id": 21102,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475446.515, "dur": 0.899, "args": { "External id": 21103,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475448.984, "dur": 0.666, "args": { "External id": 21104,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475450.516, "dur": 0.700, "args": { "External id": 21105,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475452.285, "dur": 0.395, "args": { "External id": 21106,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651475465.462, "dur": 30.141, "args": { "External id": 21107,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3698 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651475524.986, "dur": 88.653, "args": { "External id": 21108,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651475534.913, "dur": 3.805, "args": { "External id": 21109,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651475543.574, "dur": 9.831, "args": { "External id": 21110,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651475547.668, "dur": 5.357, "args": { "External id": 21111,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475550.996, "dur": 0.455, "args": { "External id": 21112,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651475559.690, "dur": 20.631, "args": { "External id": 21113,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475560.992, "dur": 1.007, "args": { "External id": 21114,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475563.266, "dur": 0.457, "args": { "External id": 21115,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475565.029, "dur": 0.533, "args": { "External id": 21116,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475566.596, "dur": 0.721, "args": { "External id": 21117,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475568.326, "dur": 0.390, "args": { "External id": 21118,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475569.996, "dur": 0.461, "args": { "External id": 21119,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475571.322, "dur": 0.401, "args": { "External id": 21120,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475572.894, "dur": 0.435, "args": { "External id": 21121,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651475574.196, "dur": 0.812, "args": { "External id": 21122,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651475589.466, "dur": 16.785, "args": { "External id": 21123,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3714 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651475652.818, "dur": 108.475, "args": { "External id": 21124,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3715 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651475679.053, "dur": 79.079, "args": { "External id": 21125,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3716, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651475687.634, "dur": 66.802, "args": { "External id": 21126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3717 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651475776.123, "dur": 1.733, "args": { "External id": 21127,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3718, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651475849.971, "dur": 1658.395, "args": { "External id": 21128,"Sequence number": 246568, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3719 } }, { "ph": "f", "id": 200, "pid": 1336757, "tid": 1381170, "ts": 1295651475849.971, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651475950.819, "dur": 154.007, "args": { "External id": 21129,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651476148.384, "dur": 38.520, "args": { "External id": 21130,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651476203.082, "dur": 69.104, "args": { "External id": 21131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651476285.566, "dur": 36.032, "args": { "External id": 21132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651476327.988, "dur": 44.863, "args": { "External id": 21133,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651476380.272, "dur": 27.988, "args": { "External id": 21134,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651476415.405, "dur": 40.653, "args": { "External id": 21135,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3726 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651476483.402, "dur": 23.908, "args": { "External id": 21136,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3727 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651476526.959, "dur": 28.231, "args": { "External id": 21137,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3728 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651476577.220, "dur": 20.994, "args": { "External id": 21138,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3729 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651476609.604, "dur": 17.268, "args": { "External id": 21139,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651476635.496, "dur": 31.238, "args": { "External id": 21140,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651476669.744, "dur": 32.461, "args": { "External id": 21141,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3732 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651476727.388, "dur": 164.513, "args": { "External id": 21142,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651476803.359, "dur": 5.774, "args": { "External id": 21143,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651476810.984, "dur": 2.656, "args": { "External id": 21144,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3735 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651476920.576, "dur": 24.718, "args": { "External id": 21145,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3736 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651476960.982, "dur": 14.834, "args": { "External id": 21146,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651477033.131, "dur": 45.510, "args": { "External id": 21147,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651477086.044, "dur": 34.478, "args": { "External id": 21148,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651477128.286, "dur": 22.002, "args": { "External id": 21149,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651477154.826, "dur": 28.667, "args": { "External id": 21150,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651477189.813, "dur": 20.952, "args": { "External id": 21151,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651477216.912, "dur": 43.509, "args": { "External id": 21152,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3743 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651477285.800, "dur": 25.927, "args": { "External id": 21153,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3744 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651477340.672, "dur": 31.901, "args": { "External id": 21154,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3745 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651477392.258, "dur": 18.184, "args": { "External id": 21155,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3746 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651477428.371, "dur": 18.659, "args": { "External id": 21156,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3747 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651477460.080, "dur": 16.526, "args": { "External id": 21157,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3748 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477550.246, "dur": 14.788, "args": { "External id": 21158,"Record function id": 0, "Ev Idx": 3749 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477553.067, "dur": 11.001, "args": { "External id": 21159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477556.997, "dur": 6.111, "args": { "External id": 21160,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3751 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477558.361, "dur": 4.656, "args": { "External id": 21161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3752 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477568.977, "dur": 4.081, "args": { "External id": 21162,"Record function id": 0, "Ev Idx": 3753 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477570.018, "dur": 2.545, "args": { "External id": 21163,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477570.654, "dur": 1.430, "args": { "External id": 21164,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3755 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477571.232, "dur": 0.784, "args": { "External id": 21165,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3756 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477576.321, "dur": 3.946, "args": { "External id": 21166,"Record function id": 0, "Ev Idx": 3757 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477577.415, "dur": 2.416, "args": { "External id": 21167,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477577.925, "dur": 1.508, "args": { "External id": 21168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3759 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477578.439, "dur": 0.874, "args": { "External id": 21169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3760 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477583.461, "dur": 3.835, "args": { "External id": 21170,"Record function id": 0, "Ev Idx": 3761 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477584.692, "dur": 2.139, "args": { "External id": 21171,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477585.345, "dur": 1.027, "args": { "External id": 21172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3763 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477585.642, "dur": 0.620, "args": { "External id": 21173,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3764 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477590.417, "dur": 3.414, "args": { "External id": 21174,"Record function id": 0, "Ev Idx": 3765 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477591.341, "dur": 2.037, "args": { "External id": 21175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477591.843, "dur": 1.098, "args": { "External id": 21176,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3767 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477592.117, "dur": 0.758, "args": { "External id": 21177,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3768 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477596.890, "dur": 4.031, "args": { "External id": 21178,"Record function id": 0, "Ev Idx": 3769 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477597.997, "dur": 2.468, "args": { "External id": 21179,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477598.832, "dur": 1.219, "args": { "External id": 21180,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3771 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477599.309, "dur": 0.667, "args": { "External id": 21181,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3772 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477604.051, "dur": 4.130, "args": { "External id": 21182,"Record function id": 0, "Ev Idx": 3773 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477605.041, "dur": 2.714, "args": { "External id": 21183,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477605.541, "dur": 1.817, "args": { "External id": 21184,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3775 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477606.056, "dur": 1.237, "args": { "External id": 21185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3776 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477611.227, "dur": 3.327, "args": { "External id": 21186,"Record function id": 0, "Ev Idx": 3777 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477612.139, "dur": 1.978, "args": { "External id": 21187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477612.627, "dur": 1.046, "args": { "External id": 21188,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3779 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477612.891, "dur": 0.705, "args": { "External id": 21189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3780 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477617.644, "dur": 5.600, "args": { "External id": 21190,"Record function id": 0, "Ev Idx": 3781 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651477618.547, "dur": 4.262, "args": { "External id": 21191,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477619.078, "dur": 3.286, "args": { "External id": 21192,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3783 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651477621.491, "dur": 0.809, "args": { "External id": 21193,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3784 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651477627.106, "dur": 37991.056, "args": { "External id": 21194,"Record function id": 0, "Sequence number": 246567, "Fwd thread id": 1, "Ev Idx": 3785 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651477628.210, "dur": 37981.625, "args": { "External id": 21195,"Sequence number": 246567, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3786 } }, { "ph": "f", "id": 201, "pid": 1336757, "tid": 1381170, "ts": 1295651477628.210, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.13)", "pid": 1336757, "tid": 1381170, "ts": 1295651477654.982, "dur": 35.975, "args": { "External id": 21196,"Record function id": 0, "Ev Idx": 3787 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.13)", "pid": 1336757, "tid": 1381170, "ts": 1295651477699.004, "dur": 60.842, "args": { "External id": 21197,"Record function id": 0, "Ev Idx": 3788 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.13)", "pid": 1336757, "tid": 1381170, "ts": 1295651477766.265, "dur": 37836.280, "args": { "External id": 21198,"Record function id": 0, "Ev Idx": 3789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651477851.119, "dur": 6.947, "args": { "External id": 21199,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651477866.704, "dur": 4.775, "args": { "External id": 21200,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3791 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651477884.583, "dur": 36891.172, "args": { "External id": 21201,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651477897.671, "dur": 36869.522, "args": { "External id": 21202,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651477941.684, "dur": 13.191, "args": { "External id": 21203,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651477960.642, "dur": 36769.749, "args": { "External id": 21204,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651477962.915, "dur": 36766.958, "args": { "External id": 21205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651477966.017, "dur": 4.978, "args": { "External id": 21206,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651477972.628, "dur": 36753.642, "args": { "External id": 21207,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651514862.604, "dur": 8.631, "args": { "External id": 21208,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651514865.374, "dur": 5.548, "args": { "External id": 21209,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3800 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651514900.098, "dur": 425.845, "args": { "External id": 21210,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3801 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651514927.676, "dur": 392.884, "args": { "External id": 21211,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3802, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651514938.545, "dur": 376.164, "args": { "External id": 21212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3803 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651515345.862, "dur": 2.422, "args": { "External id": 21213,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3804, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515409.069, "dur": 6.673, "args": { "External id": 21214,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515458.158, "dur": 1.637, "args": { "External id": 21215,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515474.794, "dur": 1.061, "args": { "External id": 21216,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515486.603, "dur": 1.149, "args": { "External id": 21217,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515496.854, "dur": 0.886, "args": { "External id": 21218,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515507.426, "dur": 0.908, "args": { "External id": 21219,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515518.203, "dur": 1.171, "args": { "External id": 21220,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515531.417, "dur": 1.182, "args": { "External id": 21221,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515542.096, "dur": 1.275, "args": { "External id": 21222,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3813 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651515632.214, "dur": 2632.671, "args": { "External id": 21223,"Record function id": 0, "Ev Idx": 3814 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.12)", "pid": 1336757, "tid": 1381170, "ts": 1295651515650.240, "dur": 975.979, "args": { "External id": 21224,"Record function id": 0, "Ev Idx": 3815 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 1336757, "tid": 1381170, "ts": 1295651515664.084, "dur": 289.576, "args": { "External id": 21225,"Record function id": 0, "Ev Idx": 3816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515736.724, "dur": 4.198, "args": { "External id": 21226,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515743.979, "dur": 1.573, "args": { "External id": 21227,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515747.279, "dur": 1.366, "args": { "External id": 21228,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515750.166, "dur": 1.407, "args": { "External id": 21229,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515753.130, "dur": 1.500, "args": { "External id": 21230,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515757.955, "dur": 1.216, "args": { "External id": 21231,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515760.519, "dur": 1.018, "args": { "External id": 21232,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515762.948, "dur": 1.164, "args": { "External id": 21233,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515765.343, "dur": 1.094, "args": { "External id": 21234,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651515769.244, "dur": 1.237, "args": { "External id": 21235,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3826 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651515788.450, "dur": 139.455, "args": { "External id": 21236,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651515803.219, "dur": 120.485, "args": { "External id": 21237,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651515819.034, "dur": 12.230, "args": { "External id": 21238,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651515834.107, "dur": 60.497, "args": { "External id": 21239,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651515836.390, "dur": 57.949, "args": { "External id": 21240,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651515839.774, "dur": 4.906, "args": { "External id": 21241,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651515846.269, "dur": 47.628, "args": { "External id": 21242,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3833 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.11", "pid": 1336757, "tid": 1381170, "ts": 1295651516088.572, "dur": 530.124, "args": { "External id": 21243,"Record function id": 0, "Ev Idx": 3834 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 1336757, "tid": 1381170, "ts": 1295651516104.359, "dur": 502.898, "args": { "External id": 21244,"Record function id": 0, "Ev Idx": 3835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651516159.616, "dur": 6.082, "args": { "External id": 21245,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651516181.470, "dur": 25.127, "args": { "External id": 21246,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516185.986, "dur": 1.888, "args": { "External id": 21247,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516189.645, "dur": 0.311, "args": { "External id": 21248,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516191.560, "dur": 0.852, "args": { "External id": 21249,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516193.773, "dur": 0.760, "args": { "External id": 21250,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516195.571, "dur": 0.325, "args": { "External id": 21251,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516197.020, "dur": 0.760, "args": { "External id": 21252,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516198.874, "dur": 0.340, "args": { "External id": 21253,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516200.773, "dur": 0.696, "args": { "External id": 21254,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516202.553, "dur": 0.440, "args": { "External id": 21255,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651516215.914, "dur": 48.206, "args": { "External id": 21256,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3847 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651516297.724, "dur": 95.052, "args": { "External id": 21257,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651516307.877, "dur": 4.223, "args": { "External id": 21258,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651516316.875, "dur": 10.077, "args": { "External id": 21259,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651516320.820, "dur": 5.751, "args": { "External id": 21260,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516324.227, "dur": 0.697, "args": { "External id": 21261,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651516333.115, "dur": 23.199, "args": { "External id": 21262,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516334.952, "dur": 0.586, "args": { "External id": 21263,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516336.906, "dur": 0.445, "args": { "External id": 21264,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516338.771, "dur": 0.832, "args": { "External id": 21265,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516340.581, "dur": 0.360, "args": { "External id": 21266,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516342.025, "dur": 0.664, "args": { "External id": 21267,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516343.858, "dur": 0.295, "args": { "External id": 21268,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516345.497, "dur": 0.853, "args": { "External id": 21269,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516347.438, "dur": 0.450, "args": { "External id": 21270,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651516348.985, "dur": 0.818, "args": { "External id": 21271,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651516366.685, "dur": 18.498, "args": { "External id": 21272,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3863 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651516437.639, "dur": 106.181, "args": { "External id": 21273,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3864 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651516461.717, "dur": 79.084, "args": { "External id": 21274,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3865, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651516471.291, "dur": 65.689, "args": { "External id": 21275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3866 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651516558.335, "dur": 1.776, "args": { "External id": 21276,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3867, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651516633.104, "dur": 1611.985, "args": { "External id": 21277,"Sequence number": 246566, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3868 } }, { "ph": "f", "id": 202, "pid": 1336757, "tid": 1381170, "ts": 1295651516633.104, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651516737.445, "dur": 98.368, "args": { "External id": 21278,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3869 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651516872.302, "dur": 39.004, "args": { "External id": 21279,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651516926.373, "dur": 46.267, "args": { "External id": 21280,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517034.445, "dur": 41.313, "args": { "External id": 21281,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517084.791, "dur": 45.632, "args": { "External id": 21282,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517138.506, "dur": 28.166, "args": { "External id": 21283,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517173.958, "dur": 41.389, "args": { "External id": 21284,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3875 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651517257.011, "dur": 26.114, "args": { "External id": 21285,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3876 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651517303.827, "dur": 28.489, "args": { "External id": 21286,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3877 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651517353.464, "dur": 20.356, "args": { "External id": 21287,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3878 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651517387.326, "dur": 15.386, "args": { "External id": 21288,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517412.435, "dur": 33.831, "args": { "External id": 21289,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517449.378, "dur": 31.903, "args": { "External id": 21290,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3881 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651517505.588, "dur": 165.945, "args": { "External id": 21291,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651517581.849, "dur": 6.086, "args": { "External id": 21292,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651517589.588, "dur": 2.162, "args": { "External id": 21293,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3884 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651517700.088, "dur": 25.068, "args": { "External id": 21294,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3885 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651517738.844, "dur": 15.607, "args": { "External id": 21295,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517761.929, "dur": 34.207, "args": { "External id": 21296,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517801.569, "dur": 32.787, "args": { "External id": 21297,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517840.657, "dur": 21.909, "args": { "External id": 21298,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517867.028, "dur": 29.177, "args": { "External id": 21299,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517901.770, "dur": 20.477, "args": { "External id": 21300,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651517928.063, "dur": 28.804, "args": { "External id": 21301,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3892 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651517973.980, "dur": 58.673, "args": { "External id": 21302,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3893 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651518054.522, "dur": 24.860, "args": { "External id": 21303,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3894 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651518095.426, "dur": 33.226, "args": { "External id": 21304,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3895 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651518153.793, "dur": 16.522, "args": { "External id": 21305,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3896 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651518185.292, "dur": 16.578, "args": { "External id": 21306,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3897 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518289.734, "dur": 14.860, "args": { "External id": 21307,"Record function id": 0, "Ev Idx": 3898 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518292.824, "dur": 10.774, "args": { "External id": 21308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518296.816, "dur": 5.932, "args": { "External id": 21309,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3900 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518298.407, "dur": 4.250, "args": { "External id": 21310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3901 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518308.334, "dur": 4.915, "args": { "External id": 21311,"Record function id": 0, "Ev Idx": 3902 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518309.506, "dur": 3.259, "args": { "External id": 21312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518310.279, "dur": 2.009, "args": { "External id": 21313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3904 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518311.389, "dur": 0.825, "args": { "External id": 21314,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3905 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518316.528, "dur": 4.285, "args": { "External id": 21315,"Record function id": 0, "Ev Idx": 3906 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518317.622, "dur": 2.707, "args": { "External id": 21316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518318.294, "dur": 1.584, "args": { "External id": 21317,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3908 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518318.867, "dur": 0.918, "args": { "External id": 21318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3909 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518323.896, "dur": 3.477, "args": { "External id": 21319,"Record function id": 0, "Ev Idx": 3910 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518324.920, "dur": 2.020, "args": { "External id": 21320,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518325.431, "dur": 1.060, "args": { "External id": 21321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3912 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518325.742, "dur": 0.660, "args": { "External id": 21322,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3913 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518330.464, "dur": 3.775, "args": { "External id": 21323,"Record function id": 0, "Ev Idx": 3914 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518331.450, "dur": 2.319, "args": { "External id": 21324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518332.192, "dur": 1.173, "args": { "External id": 21325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3916 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518332.528, "dur": 0.771, "args": { "External id": 21326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3917 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518337.373, "dur": 4.553, "args": { "External id": 21327,"Record function id": 0, "Ev Idx": 3918 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518338.362, "dur": 3.086, "args": { "External id": 21328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518339.097, "dur": 1.923, "args": { "External id": 21329,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3920 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518339.543, "dur": 1.411, "args": { "External id": 21330,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3921 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518345.129, "dur": 5.756, "args": { "External id": 21331,"Record function id": 0, "Ev Idx": 3922 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518346.041, "dur": 4.385, "args": { "External id": 21332,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518346.722, "dur": 3.253, "args": { "External id": 21333,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3924 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518349.184, "dur": 0.701, "args": { "External id": 21334,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3925 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518353.905, "dur": 3.420, "args": { "External id": 21335,"Record function id": 0, "Ev Idx": 3926 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518354.776, "dur": 2.091, "args": { "External id": 21336,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518355.290, "dur": 1.142, "args": { "External id": 21337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3928 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518355.571, "dur": 0.754, "args": { "External id": 21338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3929 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518360.471, "dur": 7.460, "args": { "External id": 21339,"Record function id": 0, "Ev Idx": 3930 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651518361.673, "dur": 5.795, "args": { "External id": 21340,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518362.158, "dur": 4.921, "args": { "External id": 21341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3932 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651518366.105, "dur": 0.899, "args": { "External id": 21342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3933 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651518371.764, "dur": 36662.768, "args": { "External id": 21343,"Record function id": 0, "Sequence number": 246565, "Fwd thread id": 1, "Ev Idx": 3934 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651518373.306, "dur": 36602.062, "args": { "External id": 21344,"Sequence number": 246565, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3935 } }, { "ph": "f", "id": 203, "pid": 1336757, "tid": 1381170, "ts": 1295651518373.306, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.12)", "pid": 1336757, "tid": 1381170, "ts": 1295651518400.079, "dur": 34.180, "args": { "External id": 21345,"Record function id": 0, "Ev Idx": 3936 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.12)", "pid": 1336757, "tid": 1381170, "ts": 1295651518441.127, "dur": 60.996, "args": { "External id": 21346,"Record function id": 0, "Ev Idx": 3937 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.12)", "pid": 1336757, "tid": 1381170, "ts": 1295651518509.723, "dur": 36458.287, "args": { "External id": 21347,"Record function id": 0, "Ev Idx": 3938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651518593.307, "dur": 6.617, "args": { "External id": 21348,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651518608.865, "dur": 5.119, "args": { "External id": 21349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3940 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651518627.640, "dur": 35510.370, "args": { "External id": 21350,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651518640.355, "dur": 35488.772, "args": { "External id": 21351,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651518685.448, "dur": 13.389, "args": { "External id": 21352,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651518704.933, "dur": 35387.055, "args": { "External id": 21353,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651518707.342, "dur": 35383.961, "args": { "External id": 21354,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651518711.005, "dur": 5.342, "args": { "External id": 21355,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651518718.088, "dur": 35369.579, "args": { "External id": 21356,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651554227.203, "dur": 20.942, "args": { "External id": 21357,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651554240.713, "dur": 6.841, "args": { "External id": 21358,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3949 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651554276.166, "dur": 410.222, "args": { "External id": 21359,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3950 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651554304.406, "dur": 377.184, "args": { "External id": 21360,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3951, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651554315.148, "dur": 360.654, "args": { "External id": 21361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3952 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651554707.558, "dur": 2.743, "args": { "External id": 21362,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3953, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554766.894, "dur": 6.710, "args": { "External id": 21363,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554822.468, "dur": 1.749, "args": { "External id": 21364,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554839.904, "dur": 1.398, "args": { "External id": 21365,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554851.889, "dur": 1.648, "args": { "External id": 21366,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554864.711, "dur": 1.219, "args": { "External id": 21367,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554876.155, "dur": 1.556, "args": { "External id": 21368,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554887.420, "dur": 1.257, "args": { "External id": 21369,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554899.113, "dur": 1.384, "args": { "External id": 21370,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651554909.964, "dur": 1.047, "args": { "External id": 21371,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3962 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651555050.576, "dur": 2583.928, "args": { "External id": 21372,"Record function id": 0, "Ev Idx": 3963 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.11)", "pid": 1336757, "tid": 1381170, "ts": 1295651555071.506, "dur": 906.112, "args": { "External id": 21373,"Record function id": 0, "Ev Idx": 3964 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 1336757, "tid": 1381170, "ts": 1295651555085.400, "dur": 320.604, "args": { "External id": 21374,"Record function id": 0, "Ev Idx": 3965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555161.651, "dur": 5.730, "args": { "External id": 21375,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555170.415, "dur": 1.922, "args": { "External id": 21376,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555174.242, "dur": 1.182, "args": { "External id": 21377,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555177.039, "dur": 1.686, "args": { "External id": 21378,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555181.858, "dur": 0.707, "args": { "External id": 21379,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555183.970, "dur": 1.490, "args": { "External id": 21380,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555186.919, "dur": 1.450, "args": { "External id": 21381,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555189.742, "dur": 1.733, "args": { "External id": 21382,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555195.016, "dur": 1.098, "args": { "External id": 21383,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651555197.450, "dur": 1.960, "args": { "External id": 21384,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3975 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651555217.302, "dur": 158.549, "args": { "External id": 21385,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651555247.409, "dur": 124.349, "args": { "External id": 21386,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651555263.648, "dur": 13.070, "args": { "External id": 21387,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651555279.914, "dur": 63.513, "args": { "External id": 21388,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651555282.412, "dur": 60.691, "args": { "External id": 21389,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555285.568, "dur": 5.736, "args": { "External id": 21390,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651555292.911, "dur": 49.308, "args": { "External id": 21391,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3982 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.10", "pid": 1336757, "tid": 1381170, "ts": 1295651555485.860, "dur": 484.512, "args": { "External id": 21392,"Record function id": 0, "Ev Idx": 3983 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 1336757, "tid": 1381170, "ts": 1295651555499.595, "dur": 459.616, "args": { "External id": 21393,"Record function id": 0, "Ev Idx": 3984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651555556.245, "dur": 4.821, "args": { "External id": 21394,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651555575.896, "dur": 24.817, "args": { "External id": 21395,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555580.665, "dur": 1.643, "args": { "External id": 21396,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555584.365, "dur": 0.309, "args": { "External id": 21397,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555586.181, "dur": 0.431, "args": { "External id": 21398,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555587.815, "dur": 0.957, "args": { "External id": 21399,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555589.995, "dur": 0.644, "args": { "External id": 21400,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555591.866, "dur": 0.569, "args": { "External id": 21401,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555593.379, "dur": 0.606, "args": { "External id": 21402,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555595.136, "dur": 0.527, "args": { "External id": 21403,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555596.516, "dur": 0.456, "args": { "External id": 21404,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651555609.658, "dur": 27.291, "args": { "External id": 21405,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3996 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651555666.029, "dur": 89.010, "args": { "External id": 21406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651555675.642, "dur": 3.853, "args": { "External id": 21407,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651555683.921, "dur": 10.226, "args": { "External id": 21408,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651555688.152, "dur": 5.603, "args": { "External id": 21409,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555691.618, "dur": 0.787, "args": { "External id": 21410,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651555700.503, "dur": 21.116, "args": { "External id": 21411,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555702.084, "dur": 0.622, "args": { "External id": 21412,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555704.027, "dur": 0.308, "args": { "External id": 21413,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555705.302, "dur": 0.665, "args": { "External id": 21414,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555706.986, "dur": 0.717, "args": { "External id": 21415,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555708.834, "dur": 0.901, "args": { "External id": 21416,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555711.027, "dur": 0.406, "args": { "External id": 21417,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555712.549, "dur": 0.534, "args": { "External id": 21418,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555714.181, "dur": 0.488, "args": { "External id": 21419,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651555715.798, "dur": 0.450, "args": { "External id": 21420,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651555730.855, "dur": 17.152, "args": { "External id": 21421,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4012 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651555794.857, "dur": 105.213, "args": { "External id": 21422,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4013 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651555819.703, "dur": 77.126, "args": { "External id": 21423,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4014, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651555828.378, "dur": 64.945, "args": { "External id": 21424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4015 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651555915.352, "dur": 2.000, "args": { "External id": 21425,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4016, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651556035.643, "dur": 1579.331, "args": { "External id": 21426,"Sequence number": 246564, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4017 } }, { "ph": "f", "id": 204, "pid": 1336757, "tid": 1381170, "ts": 1295651556035.643, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651556145.753, "dur": 119.708, "args": { "External id": 21427,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4018 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651556308.816, "dur": 40.635, "args": { "External id": 21428,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651556365.697, "dur": 52.416, "args": { "External id": 21429,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651556427.872, "dur": 34.123, "args": { "External id": 21430,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651556468.477, "dur": 44.885, "args": { "External id": 21431,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651556520.542, "dur": 27.478, "args": { "External id": 21432,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651556555.114, "dur": 41.840, "args": { "External id": 21433,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4024 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651556620.925, "dur": 22.738, "args": { "External id": 21434,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4025 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651556662.328, "dur": 27.157, "args": { "External id": 21435,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4026 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651556709.998, "dur": 20.649, "args": { "External id": 21436,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4027 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651556744.762, "dur": 15.574, "args": { "External id": 21437,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651556768.101, "dur": 28.578, "args": { "External id": 21438,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651556799.866, "dur": 31.621, "args": { "External id": 21439,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4030 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651556858.176, "dur": 203.139, "args": { "External id": 21440,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651556934.257, "dur": 5.838, "args": { "External id": 21441,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651556942.222, "dur": 2.055, "args": { "External id": 21442,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4033 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651557094.266, "dur": 26.010, "args": { "External id": 21443,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4034 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651557132.749, "dur": 15.463, "args": { "External id": 21444,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651557156.896, "dur": 40.757, "args": { "External id": 21445,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651557203.258, "dur": 48.902, "args": { "External id": 21446,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651557262.235, "dur": 25.283, "args": { "External id": 21447,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651557292.234, "dur": 29.187, "args": { "External id": 21448,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651557327.228, "dur": 24.490, "args": { "External id": 21449,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651557357.310, "dur": 28.711, "args": { "External id": 21450,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4041 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651557405.233, "dur": 22.752, "args": { "External id": 21451,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4042 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651557445.671, "dur": 23.295, "args": { "External id": 21452,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4043 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651557483.116, "dur": 32.300, "args": { "External id": 21453,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4044 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651557538.215, "dur": 15.941, "args": { "External id": 21454,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4045 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651557568.087, "dur": 16.920, "args": { "External id": 21455,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4046 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557656.408, "dur": 17.676, "args": { "External id": 21456,"Record function id": 0, "Ev Idx": 4047 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557659.537, "dur": 13.655, "args": { "External id": 21457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557663.720, "dur": 8.586, "args": { "External id": 21458,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4049 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557665.246, "dur": 6.966, "args": { "External id": 21459,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4050 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557678.000, "dur": 4.819, "args": { "External id": 21460,"Record function id": 0, "Ev Idx": 4051 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557679.490, "dur": 2.832, "args": { "External id": 21461,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557680.236, "dur": 1.516, "args": { "External id": 21462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4053 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557680.911, "dur": 0.765, "args": { "External id": 21463,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4054 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557686.102, "dur": 3.954, "args": { "External id": 21464,"Record function id": 0, "Ev Idx": 4055 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557687.226, "dur": 2.358, "args": { "External id": 21465,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557687.699, "dur": 1.415, "args": { "External id": 21466,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4057 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557688.251, "dur": 0.775, "args": { "External id": 21467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4058 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557693.287, "dur": 3.929, "args": { "External id": 21468,"Record function id": 0, "Ev Idx": 4059 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557694.506, "dur": 2.295, "args": { "External id": 21469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557695.008, "dur": 1.328, "args": { "External id": 21470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4061 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557695.629, "dur": 0.608, "args": { "External id": 21471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4062 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557700.287, "dur": 3.208, "args": { "External id": 21472,"Record function id": 0, "Ev Idx": 4063 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557701.252, "dur": 1.816, "args": { "External id": 21473,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557701.734, "dur": 0.927, "args": { "External id": 21474,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4065 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557702.025, "dur": 0.563, "args": { "External id": 21475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4066 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557706.561, "dur": 3.793, "args": { "External id": 21476,"Record function id": 0, "Ev Idx": 4067 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557707.717, "dur": 2.219, "args": { "External id": 21477,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557708.175, "dur": 1.325, "args": { "External id": 21478,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4069 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557708.683, "dur": 0.727, "args": { "External id": 21479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4070 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557713.692, "dur": 3.356, "args": { "External id": 21480,"Record function id": 0, "Ev Idx": 4071 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557714.733, "dur": 1.880, "args": { "External id": 21481,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557715.214, "dur": 0.966, "args": { "External id": 21482,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4073 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557715.519, "dur": 0.588, "args": { "External id": 21483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4074 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557720.161, "dur": 3.493, "args": { "External id": 21484,"Record function id": 0, "Ev Idx": 4075 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557721.042, "dur": 2.168, "args": { "External id": 21485,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557721.794, "dur": 0.975, "args": { "External id": 21486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4077 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557722.191, "dur": 0.509, "args": { "External id": 21487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4078 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557726.690, "dur": 3.857, "args": { "External id": 21488,"Record function id": 0, "Ev Idx": 4079 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651557727.654, "dur": 2.448, "args": { "External id": 21489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557728.123, "dur": 1.569, "args": { "External id": 21490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4081 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651557728.897, "dur": 0.719, "args": { "External id": 21491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4082 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651557733.925, "dur": 35914.258, "args": { "External id": 21492,"Record function id": 0, "Sequence number": 246563, "Fwd thread id": 1, "Ev Idx": 4083 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651557735.398, "dur": 35904.507, "args": { "External id": 21493,"Sequence number": 246563, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4084 } }, { "ph": "f", "id": 205, "pid": 1336757, "tid": 1381170, "ts": 1295651557735.398, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.11)", "pid": 1336757, "tid": 1381170, "ts": 1295651557762.777, "dur": 35.306, "args": { "External id": 21494,"Record function id": 0, "Ev Idx": 4085 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.11)", "pid": 1336757, "tid": 1381170, "ts": 1295651557806.157, "dur": 57.169, "args": { "External id": 21495,"Record function id": 0, "Ev Idx": 4086 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.11)", "pid": 1336757, "tid": 1381170, "ts": 1295651557869.540, "dur": 35762.201, "args": { "External id": 21496,"Record function id": 0, "Ev Idx": 4087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651557954.902, "dur": 6.207, "args": { "External id": 21497,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651557970.180, "dur": 4.791, "args": { "External id": 21498,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4089 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651558029.406, "dur": 34822.172, "args": { "External id": 21499,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651558043.117, "dur": 34800.724, "args": { "External id": 21500,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651558088.427, "dur": 15.582, "args": { "External id": 21501,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651558110.120, "dur": 34694.301, "args": { "External id": 21502,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651558112.735, "dur": 34691.049, "args": { "External id": 21503,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651558116.478, "dur": 6.031, "args": { "External id": 21504,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651558145.524, "dur": 34654.707, "args": { "External id": 21505,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651592939.032, "dur": 9.876, "args": { "External id": 21506,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651592941.643, "dur": 6.943, "args": { "External id": 21507,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4098 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651592976.153, "dur": 372.880, "args": { "External id": 21508,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4099 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651593041.270, "dur": 302.948, "args": { "External id": 21509,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4100, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651593054.843, "dur": 283.643, "args": { "External id": 21510,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4101 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651593370.478, "dur": 2.309, "args": { "External id": 21511,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4102, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593433.757, "dur": 6.570, "args": { "External id": 21512,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593484.378, "dur": 1.168, "args": { "External id": 21513,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593500.798, "dur": 1.161, "args": { "External id": 21514,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593512.987, "dur": 1.136, "args": { "External id": 21515,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593525.602, "dur": 0.967, "args": { "External id": 21516,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593537.392, "dur": 0.963, "args": { "External id": 21517,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593550.432, "dur": 1.518, "args": { "External id": 21518,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593561.736, "dur": 1.027, "args": { "External id": 21519,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593572.114, "dur": 1.189, "args": { "External id": 21520,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4111 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651593661.127, "dur": 2685.776, "args": { "External id": 21521,"Record function id": 0, "Ev Idx": 4112 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.10)", "pid": 1336757, "tid": 1381170, "ts": 1295651593680.714, "dur": 993.556, "args": { "External id": 21522,"Record function id": 0, "Ev Idx": 4113 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 1336757, "tid": 1381170, "ts": 1295651593694.392, "dur": 347.507, "args": { "External id": 21523,"Record function id": 0, "Ev Idx": 4114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593768.966, "dur": 4.158, "args": { "External id": 21524,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593776.029, "dur": 1.120, "args": { "External id": 21525,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593780.914, "dur": 1.307, "args": { "External id": 21526,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593783.582, "dur": 1.183, "args": { "External id": 21527,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593786.138, "dur": 1.254, "args": { "External id": 21528,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593788.826, "dur": 1.580, "args": { "External id": 21529,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593793.849, "dur": 1.127, "args": { "External id": 21530,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593796.208, "dur": 1.631, "args": { "External id": 21531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593799.030, "dur": 1.545, "args": { "External id": 21532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651593802.006, "dur": 1.367, "args": { "External id": 21533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4124 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651593822.511, "dur": 138.366, "args": { "External id": 21534,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651593837.474, "dur": 119.318, "args": { "External id": 21535,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651593852.190, "dur": 12.351, "args": { "External id": 21536,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651593868.021, "dur": 61.135, "args": { "External id": 21537,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651593870.807, "dur": 58.075, "args": { "External id": 21538,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651593874.572, "dur": 5.002, "args": { "External id": 21539,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651593881.128, "dur": 47.206, "args": { "External id": 21540,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4131 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.9", "pid": 1336757, "tid": 1381170, "ts": 1295651594124.523, "dur": 542.524, "args": { "External id": 21541,"Record function id": 0, "Ev Idx": 4132 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 1336757, "tid": 1381170, "ts": 1295651594142.068, "dur": 513.131, "args": { "External id": 21542,"Record function id": 0, "Ev Idx": 4133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651594201.515, "dur": 5.362, "args": { "External id": 21543,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651594223.106, "dur": 45.682, "args": { "External id": 21544,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594241.443, "dur": 2.317, "args": { "External id": 21545,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594246.873, "dur": 0.340, "args": { "External id": 21546,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594248.617, "dur": 0.347, "args": { "External id": 21547,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594250.484, "dur": 0.795, "args": { "External id": 21548,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594252.603, "dur": 0.386, "args": { "External id": 21549,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594254.111, "dur": 0.950, "args": { "External id": 21550,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594260.788, "dur": 0.290, "args": { "External id": 21551,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594262.545, "dur": 1.190, "args": { "External id": 21552,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594264.894, "dur": 0.265, "args": { "External id": 21553,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651594279.400, "dur": 32.772, "args": { "External id": 21554,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4145 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651594345.036, "dur": 93.919, "args": { "External id": 21555,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651594355.364, "dur": 3.879, "args": { "External id": 21556,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651594363.886, "dur": 9.987, "args": { "External id": 21557,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651594368.409, "dur": 5.052, "args": { "External id": 21558,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594371.489, "dur": 0.686, "args": { "External id": 21559,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651594382.668, "dur": 22.614, "args": { "External id": 21560,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594384.493, "dur": 0.883, "args": { "External id": 21561,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594386.720, "dur": 0.440, "args": { "External id": 21562,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594388.444, "dur": 0.589, "args": { "External id": 21563,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594390.354, "dur": 0.197, "args": { "External id": 21564,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594391.855, "dur": 0.485, "args": { "External id": 21565,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594393.195, "dur": 0.324, "args": { "External id": 21566,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594394.569, "dur": 0.859, "args": { "External id": 21567,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594396.824, "dur": 0.354, "args": { "External id": 21568,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651594398.350, "dur": 0.850, "args": { "External id": 21569,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651594414.179, "dur": 17.469, "args": { "External id": 21570,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4161 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651594483.185, "dur": 108.098, "args": { "External id": 21571,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4162 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651594508.368, "dur": 79.782, "args": { "External id": 21572,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4163, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651594517.458, "dur": 67.013, "args": { "External id": 21573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4164 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651594607.308, "dur": 1.891, "args": { "External id": 21574,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4165, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651594681.257, "dur": 1645.444, "args": { "External id": 21575,"Sequence number": 246562, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4166 } }, { "ph": "f", "id": 206, "pid": 1336757, "tid": 1381170, "ts": 1295651594681.257, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651594784.897, "dur": 98.769, "args": { "External id": 21576,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4167 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651594919.086, "dur": 37.671, "args": { "External id": 21577,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651594971.449, "dur": 107.283, "args": { "External id": 21578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595093.241, "dur": 34.911, "args": { "External id": 21579,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595134.449, "dur": 46.867, "args": { "External id": 21580,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595188.115, "dur": 28.165, "args": { "External id": 21581,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595223.620, "dur": 58.749, "args": { "External id": 21582,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4173 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651595313.079, "dur": 23.693, "args": { "External id": 21583,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4174 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651595365.631, "dur": 28.883, "args": { "External id": 21584,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4175 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651595415.145, "dur": 18.599, "args": { "External id": 21585,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4176 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651595448.038, "dur": 15.114, "args": { "External id": 21586,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595472.308, "dur": 31.630, "args": { "External id": 21587,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595506.928, "dur": 32.663, "args": { "External id": 21588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4179 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651595565.709, "dur": 164.336, "args": { "External id": 21589,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651595640.848, "dur": 6.179, "args": { "External id": 21590,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651595649.088, "dur": 2.367, "args": { "External id": 21591,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4182 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651595759.030, "dur": 22.959, "args": { "External id": 21592,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4183 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651595793.014, "dur": 15.416, "args": { "External id": 21593,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595815.440, "dur": 33.318, "args": { "External id": 21594,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595854.183, "dur": 33.120, "args": { "External id": 21595,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595893.735, "dur": 21.678, "args": { "External id": 21596,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595919.821, "dur": 29.245, "args": { "External id": 21597,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651595955.394, "dur": 20.998, "args": { "External id": 21598,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651596031.937, "dur": 35.923, "args": { "External id": 21599,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4190 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651596090.211, "dur": 24.517, "args": { "External id": 21600,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4191 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651596134.873, "dur": 32.649, "args": { "External id": 21601,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4192 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651596191.812, "dur": 23.623, "args": { "External id": 21602,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4193 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651596247.010, "dur": 18.558, "args": { "External id": 21603,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4194 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651596281.515, "dur": 16.851, "args": { "External id": 21604,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4195 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596368.966, "dur": 15.372, "args": { "External id": 21605,"Record function id": 0, "Ev Idx": 4196 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596372.577, "dur": 10.985, "args": { "External id": 21606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596376.631, "dur": 6.012, "args": { "External id": 21607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4198 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596378.126, "dur": 4.428, "args": { "External id": 21608,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4199 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596387.998, "dur": 5.440, "args": { "External id": 21609,"Record function id": 0, "Ev Idx": 4200 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596389.701, "dur": 3.258, "args": { "External id": 21610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596390.723, "dur": 1.722, "args": { "External id": 21611,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4202 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596391.387, "dur": 0.991, "args": { "External id": 21612,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4203 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596396.814, "dur": 3.750, "args": { "External id": 21613,"Record function id": 0, "Ev Idx": 4204 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596397.833, "dur": 2.282, "args": { "External id": 21614,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596398.362, "dur": 1.316, "args": { "External id": 21615,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4206 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596398.906, "dur": 0.679, "args": { "External id": 21616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4207 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596403.871, "dur": 3.571, "args": { "External id": 21617,"Record function id": 0, "Ev Idx": 4208 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596405.078, "dur": 1.912, "args": { "External id": 21618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596405.545, "dur": 0.993, "args": { "External id": 21619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4210 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596405.818, "dur": 0.615, "args": { "External id": 21620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4211 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596410.562, "dur": 3.296, "args": { "External id": 21621,"Record function id": 0, "Ev Idx": 4212 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596411.592, "dur": 1.808, "args": { "External id": 21622,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596412.158, "dur": 0.802, "args": { "External id": 21623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4214 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596412.455, "dur": 0.443, "args": { "External id": 21624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4215 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596417.015, "dur": 3.664, "args": { "External id": 21625,"Record function id": 0, "Ev Idx": 4216 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596417.894, "dur": 2.342, "args": { "External id": 21626,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596418.348, "dur": 1.466, "args": { "External id": 21627,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4218 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596418.964, "dur": 0.785, "args": { "External id": 21628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4219 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596423.990, "dur": 3.876, "args": { "External id": 21629,"Record function id": 0, "Ev Idx": 4220 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596424.857, "dur": 2.594, "args": { "External id": 21630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596425.802, "dur": 1.209, "args": { "External id": 21631,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4222 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596426.373, "dur": 0.573, "args": { "External id": 21632,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4223 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596430.940, "dur": 3.647, "args": { "External id": 21633,"Record function id": 0, "Ev Idx": 4224 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596432.031, "dur": 2.131, "args": { "External id": 21634,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596432.725, "dur": 0.993, "args": { "External id": 21635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4226 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596433.139, "dur": 0.503, "args": { "External id": 21636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4227 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596437.618, "dur": 5.420, "args": { "External id": 21637,"Record function id": 0, "Ev Idx": 4228 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651596438.478, "dur": 4.144, "args": { "External id": 21638,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596438.927, "dur": 3.246, "args": { "External id": 21639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4230 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651596441.325, "dur": 0.746, "args": { "External id": 21640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4231 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651596447.015, "dur": 35821.137, "args": { "External id": 21641,"Record function id": 0, "Sequence number": 246561, "Fwd thread id": 1, "Ev Idx": 4232 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651596448.125, "dur": 35810.384, "args": { "External id": 21642,"Sequence number": 246561, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4233 } }, { "ph": "f", "id": 207, "pid": 1336757, "tid": 1381170, "ts": 1295651596448.125, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.10)", "pid": 1336757, "tid": 1381170, "ts": 1295651596478.965, "dur": 37.369, "args": { "External id": 21643,"Record function id": 0, "Ev Idx": 4234 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.10)", "pid": 1336757, "tid": 1381170, "ts": 1295651596523.487, "dur": 62.961, "args": { "External id": 21644,"Record function id": 0, "Ev Idx": 4235 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.10)", "pid": 1336757, "tid": 1381170, "ts": 1295651596592.448, "dur": 35656.360, "args": { "External id": 21645,"Record function id": 0, "Ev Idx": 4236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651596678.013, "dur": 6.735, "args": { "External id": 21646,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651596693.725, "dur": 4.698, "args": { "External id": 21647,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4238 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651596712.583, "dur": 34705.975, "args": { "External id": 21648,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651596725.422, "dur": 34685.423, "args": { "External id": 21649,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651596771.452, "dur": 15.068, "args": { "External id": 21650,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651596792.428, "dur": 34580.423, "args": { "External id": 21651,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651596796.772, "dur": 34575.552, "args": { "External id": 21652,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651596800.712, "dur": 5.812, "args": { "External id": 21653,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651596808.112, "dur": 34560.801, "args": { "External id": 21654,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651631504.841, "dur": 8.781, "args": { "External id": 21655,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651631507.526, "dur": 5.759, "args": { "External id": 21656,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4247 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651631541.038, "dur": 379.674, "args": { "External id": 21657,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4248 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651631569.587, "dur": 346.990, "args": { "External id": 21658,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4249, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651631580.134, "dur": 330.823, "args": { "External id": 21659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4250 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651631938.088, "dur": 2.389, "args": { "External id": 21660,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4251, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632038.484, "dur": 6.730, "args": { "External id": 21661,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632089.763, "dur": 1.701, "args": { "External id": 21662,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632106.616, "dur": 1.296, "args": { "External id": 21663,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632119.874, "dur": 1.029, "args": { "External id": 21664,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632132.097, "dur": 1.112, "args": { "External id": 21665,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632142.023, "dur": 1.260, "args": { "External id": 21666,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632154.837, "dur": 0.841, "args": { "External id": 21667,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632166.165, "dur": 1.349, "args": { "External id": 21668,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632175.499, "dur": 1.500, "args": { "External id": 21669,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4260 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651632284.097, "dur": 2526.806, "args": { "External id": 21670,"Record function id": 0, "Ev Idx": 4261 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.9)", "pid": 1336757, "tid": 1381170, "ts": 1295651632302.918, "dur": 955.377, "args": { "External id": 21671,"Record function id": 0, "Ev Idx": 4262 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 1336757, "tid": 1381170, "ts": 1295651632315.433, "dur": 296.232, "args": { "External id": 21672,"Record function id": 0, "Ev Idx": 4263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632390.597, "dur": 4.463, "args": { "External id": 21673,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632398.016, "dur": 1.848, "args": { "External id": 21674,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632403.082, "dur": 0.853, "args": { "External id": 21675,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632405.597, "dur": 1.083, "args": { "External id": 21676,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632408.026, "dur": 0.904, "args": { "External id": 21677,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632410.313, "dur": 1.427, "args": { "External id": 21678,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632414.840, "dur": 1.257, "args": { "External id": 21679,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632417.557, "dur": 0.849, "args": { "External id": 21680,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632419.644, "dur": 1.577, "args": { "External id": 21681,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651632422.722, "dur": 1.074, "args": { "External id": 21682,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4273 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651632442.657, "dur": 142.283, "args": { "External id": 21683,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651632458.043, "dur": 122.899, "args": { "External id": 21684,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651632472.855, "dur": 11.624, "args": { "External id": 21685,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651632487.265, "dur": 66.171, "args": { "External id": 21686,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651632490.037, "dur": 63.090, "args": { "External id": 21687,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632493.751, "dur": 5.329, "args": { "External id": 21688,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651632502.578, "dur": 50.016, "args": { "External id": 21689,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4280 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.8", "pid": 1336757, "tid": 1381170, "ts": 1295651632687.354, "dur": 562.226, "args": { "External id": 21690,"Record function id": 0, "Ev Idx": 4281 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 1336757, "tid": 1381170, "ts": 1295651632701.166, "dur": 519.423, "args": { "External id": 21691,"Record function id": 0, "Ev Idx": 4282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651632753.261, "dur": 4.863, "args": { "External id": 21692,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651632772.533, "dur": 22.796, "args": { "External id": 21693,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632776.778, "dur": 1.645, "args": { "External id": 21694,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632780.097, "dur": 0.427, "args": { "External id": 21695,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632781.698, "dur": 1.091, "args": { "External id": 21696,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632784.311, "dur": 0.734, "args": { "External id": 21697,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632786.009, "dur": 0.811, "args": { "External id": 21698,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632788.163, "dur": 0.324, "args": { "External id": 21699,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632789.412, "dur": 0.558, "args": { "External id": 21700,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632790.864, "dur": 0.290, "args": { "External id": 21701,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632791.866, "dur": 0.461, "args": { "External id": 21702,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651632803.969, "dur": 27.006, "args": { "External id": 21703,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4294 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651632858.587, "dur": 85.794, "args": { "External id": 21704,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651632867.474, "dur": 2.865, "args": { "External id": 21705,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651632874.992, "dur": 9.846, "args": { "External id": 21706,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651632879.205, "dur": 5.254, "args": { "External id": 21707,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632882.194, "dur": 1.026, "args": { "External id": 21708,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651632890.838, "dur": 21.479, "args": { "External id": 21709,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632892.606, "dur": 0.812, "args": { "External id": 21710,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632894.655, "dur": 0.380, "args": { "External id": 21711,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632896.277, "dur": 0.759, "args": { "External id": 21712,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632898.208, "dur": 0.405, "args": { "External id": 21713,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632899.942, "dur": 0.764, "args": { "External id": 21714,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632901.824, "dur": 0.367, "args": { "External id": 21715,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632903.413, "dur": 0.328, "args": { "External id": 21716,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632904.664, "dur": 0.440, "args": { "External id": 21717,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651632906.097, "dur": 0.586, "args": { "External id": 21718,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651632920.657, "dur": 16.723, "args": { "External id": 21719,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4310 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651633037.057, "dur": 113.879, "args": { "External id": 21720,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4311 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651633063.202, "dur": 84.229, "args": { "External id": 21721,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4312, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651633074.461, "dur": 68.941, "args": { "External id": 21722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4313 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651633166.463, "dur": 1.717, "args": { "External id": 21723,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4314, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651633265.525, "dur": 1526.299, "args": { "External id": 21724,"Sequence number": 246560, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4315 } }, { "ph": "f", "id": 208, "pid": 1336757, "tid": 1381170, "ts": 1295651633265.525, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651633372.830, "dur": 101.818, "args": { "External id": 21725,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4316 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651633510.022, "dur": 37.966, "args": { "External id": 21726,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651633563.049, "dur": 47.047, "args": { "External id": 21727,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651633619.150, "dur": 31.914, "args": { "External id": 21728,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651633657.776, "dur": 45.073, "args": { "External id": 21729,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651633709.819, "dur": 27.415, "args": { "External id": 21730,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651633744.223, "dur": 41.568, "args": { "External id": 21731,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4322 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651633810.111, "dur": 21.597, "args": { "External id": 21732,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4323 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651633849.239, "dur": 26.962, "args": { "External id": 21733,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4324 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651633897.897, "dur": 19.263, "args": { "External id": 21734,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4325 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651633929.500, "dur": 15.344, "args": { "External id": 21735,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651633952.422, "dur": 64.740, "args": { "External id": 21736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651634023.069, "dur": 37.675, "args": { "External id": 21737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4328 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651634089.107, "dur": 179.834, "args": { "External id": 21738,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651634163.962, "dur": 6.410, "args": { "External id": 21739,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651634172.234, "dur": 2.426, "args": { "External id": 21740,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4331 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651634301.426, "dur": 27.465, "args": { "External id": 21741,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4332 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651634339.355, "dur": 14.763, "args": { "External id": 21742,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651634362.381, "dur": 39.438, "args": { "External id": 21743,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651634407.453, "dur": 33.738, "args": { "External id": 21744,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651634447.427, "dur": 21.524, "args": { "External id": 21745,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651634475.564, "dur": 28.792, "args": { "External id": 21746,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651634510.007, "dur": 21.297, "args": { "External id": 21747,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651634536.667, "dur": 29.887, "args": { "External id": 21748,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4339 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651634586.861, "dur": 22.247, "args": { "External id": 21749,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4340 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651634624.982, "dur": 22.807, "args": { "External id": 21750,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4341 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651634663.062, "dur": 18.314, "args": { "External id": 21751,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4342 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651634708.840, "dur": 22.572, "args": { "External id": 21752,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4343 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651634748.207, "dur": 16.898, "args": { "External id": 21753,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4344 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634832.377, "dur": 18.374, "args": { "External id": 21754,"Record function id": 0, "Ev Idx": 4345 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634838.723, "dur": 11.129, "args": { "External id": 21755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634842.823, "dur": 6.163, "args": { "External id": 21756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4347 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634844.403, "dur": 4.493, "args": { "External id": 21757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4348 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634854.542, "dur": 4.875, "args": { "External id": 21758,"Record function id": 0, "Ev Idx": 4349 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634855.797, "dur": 3.137, "args": { "External id": 21759,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634856.761, "dur": 1.663, "args": { "External id": 21760,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4351 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634857.427, "dur": 0.930, "args": { "External id": 21761,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4352 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634862.900, "dur": 4.230, "args": { "External id": 21762,"Record function id": 0, "Ev Idx": 4353 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634863.960, "dur": 2.716, "args": { "External id": 21763,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634864.709, "dur": 1.518, "args": { "External id": 21764,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4355 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634865.549, "dur": 0.594, "args": { "External id": 21765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4356 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634870.395, "dur": 3.562, "args": { "External id": 21766,"Record function id": 0, "Ev Idx": 4357 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634871.477, "dur": 2.066, "args": { "External id": 21767,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634872.161, "dur": 0.961, "args": { "External id": 21768,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4359 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634872.483, "dur": 0.547, "args": { "External id": 21769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4360 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634877.064, "dur": 3.635, "args": { "External id": 21770,"Record function id": 0, "Ev Idx": 4361 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634877.985, "dur": 2.293, "args": { "External id": 21771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634878.614, "dur": 1.245, "args": { "External id": 21772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4363 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634879.003, "dur": 0.789, "args": { "External id": 21773,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4364 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634883.827, "dur": 4.101, "args": { "External id": 21774,"Record function id": 0, "Ev Idx": 4365 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634884.892, "dur": 2.620, "args": { "External id": 21775,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634885.399, "dur": 1.700, "args": { "External id": 21776,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4367 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634886.204, "dur": 0.824, "args": { "External id": 21777,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4368 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634891.229, "dur": 3.756, "args": { "External id": 21778,"Record function id": 0, "Ev Idx": 4369 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634892.428, "dur": 2.144, "args": { "External id": 21779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634892.964, "dur": 1.194, "args": { "External id": 21780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4371 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634893.425, "dur": 0.666, "args": { "External id": 21781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4372 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634898.136, "dur": 3.860, "args": { "External id": 21782,"Record function id": 0, "Ev Idx": 4373 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634899.343, "dur": 2.227, "args": { "External id": 21783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634899.958, "dur": 1.155, "args": { "External id": 21784,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4375 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634900.498, "dur": 0.540, "args": { "External id": 21785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4376 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634905.050, "dur": 3.436, "args": { "External id": 21786,"Record function id": 0, "Ev Idx": 4377 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651634905.961, "dur": 2.124, "args": { "External id": 21787,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634906.465, "dur": 1.196, "args": { "External id": 21788,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4379 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651634906.804, "dur": 0.798, "args": { "External id": 21789,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4380 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651634912.320, "dur": 35964.838, "args": { "External id": 21790,"Record function id": 0, "Sequence number": 246559, "Fwd thread id": 1, "Ev Idx": 4381 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651634913.503, "dur": 35955.562, "args": { "External id": 21791,"Sequence number": 246559, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4382 } }, { "ph": "f", "id": 209, "pid": 1336757, "tid": 1381170, "ts": 1295651634913.503, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.9)", "pid": 1336757, "tid": 1381170, "ts": 1295651634940.785, "dur": 32.912, "args": { "External id": 21792,"Record function id": 0, "Ev Idx": 4383 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.9)", "pid": 1336757, "tid": 1381170, "ts": 1295651634980.540, "dur": 114.855, "args": { "External id": 21793,"Record function id": 0, "Ev Idx": 4384 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.9)", "pid": 1336757, "tid": 1381170, "ts": 1295651635102.882, "dur": 35758.972, "args": { "External id": 21794,"Record function id": 0, "Ev Idx": 4385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651635187.486, "dur": 7.086, "args": { "External id": 21795,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651635204.215, "dur": 5.214, "args": { "External id": 21796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4387 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651635223.148, "dur": 34879.562, "args": { "External id": 21797,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651635251.794, "dur": 34841.397, "args": { "External id": 21798,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651635297.245, "dur": 14.783, "args": { "External id": 21799,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651635318.225, "dur": 34736.283, "args": { "External id": 21800,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651635320.797, "dur": 34732.997, "args": { "External id": 21801,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651635324.308, "dur": 5.654, "args": { "External id": 21802,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651635333.135, "dur": 34716.844, "args": { "External id": 21803,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651670196.265, "dur": 9.779, "args": { "External id": 21804,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651670199.186, "dur": 6.510, "args": { "External id": 21805,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4396 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651670244.942, "dur": 347.703, "args": { "External id": 21806,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4397 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651670273.452, "dur": 314.696, "args": { "External id": 21807,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4398, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651670287.262, "dur": 295.836, "args": { "External id": 21808,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4399 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651670611.182, "dur": 2.317, "args": { "External id": 21809,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4400, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670670.706, "dur": 6.422, "args": { "External id": 21810,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670719.674, "dur": 1.457, "args": { "External id": 21811,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670736.066, "dur": 1.520, "args": { "External id": 21812,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670748.017, "dur": 1.009, "args": { "External id": 21813,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670760.144, "dur": 0.834, "args": { "External id": 21814,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670770.815, "dur": 1.216, "args": { "External id": 21815,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670781.595, "dur": 0.979, "args": { "External id": 21816,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670792.475, "dur": 1.628, "args": { "External id": 21817,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651670804.135, "dur": 1.085, "args": { "External id": 21818,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4409 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651670890.694, "dur": 2658.315, "args": { "External id": 21819,"Record function id": 0, "Ev Idx": 4410 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.8)", "pid": 1336757, "tid": 1381170, "ts": 1295651670910.107, "dur": 961.421, "args": { "External id": 21820,"Record function id": 0, "Ev Idx": 4411 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 1336757, "tid": 1381170, "ts": 1295651670922.870, "dur": 361.163, "args": { "External id": 21821,"Record function id": 0, "Ev Idx": 4412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671045.583, "dur": 5.144, "args": { "External id": 21822,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671054.267, "dur": 1.521, "args": { "External id": 21823,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671057.640, "dur": 1.316, "args": { "External id": 21824,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671060.410, "dur": 1.650, "args": { "External id": 21825,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671064.773, "dur": 1.761, "args": { "External id": 21826,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671067.755, "dur": 0.991, "args": { "External id": 21827,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671070.200, "dur": 0.534, "args": { "External id": 21828,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671072.021, "dur": 1.613, "args": { "External id": 21829,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671076.613, "dur": 0.492, "args": { "External id": 21830,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651671078.287, "dur": 1.125, "args": { "External id": 21831,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4422 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651671096.823, "dur": 154.804, "args": { "External id": 21832,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651671112.980, "dur": 133.783, "args": { "External id": 21833,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651671127.807, "dur": 12.175, "args": { "External id": 21834,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651671143.156, "dur": 61.337, "args": { "External id": 21835,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651671145.377, "dur": 58.822, "args": { "External id": 21836,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671148.859, "dur": 4.835, "args": { "External id": 21837,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651671155.314, "dur": 48.413, "args": { "External id": 21838,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4429 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.7", "pid": 1336757, "tid": 1381170, "ts": 1295651671364.109, "dur": 499.779, "args": { "External id": 21839,"Record function id": 0, "Ev Idx": 4430 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 1336757, "tid": 1381170, "ts": 1295651671380.907, "dur": 471.209, "args": { "External id": 21840,"Record function id": 0, "Ev Idx": 4431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651671437.133, "dur": 5.432, "args": { "External id": 21841,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651671457.662, "dur": 23.294, "args": { "External id": 21842,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671461.989, "dur": 1.769, "args": { "External id": 21843,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671465.706, "dur": 0.345, "args": { "External id": 21844,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671467.548, "dur": 0.374, "args": { "External id": 21845,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671469.131, "dur": 0.247, "args": { "External id": 21846,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671470.530, "dur": 0.713, "args": { "External id": 21847,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671472.469, "dur": 0.609, "args": { "External id": 21848,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671474.007, "dur": 0.871, "args": { "External id": 21849,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671475.917, "dur": 0.351, "args": { "External id": 21850,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671476.976, "dur": 0.940, "args": { "External id": 21851,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651671490.363, "dur": 29.574, "args": { "External id": 21852,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4443 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651671549.665, "dur": 88.446, "args": { "External id": 21853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651671559.175, "dur": 2.946, "args": { "External id": 21854,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651671566.683, "dur": 9.816, "args": { "External id": 21855,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651671570.862, "dur": 5.200, "args": { "External id": 21856,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671573.865, "dur": 0.926, "args": { "External id": 21857,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651671582.555, "dur": 21.475, "args": { "External id": 21858,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671584.197, "dur": 0.421, "args": { "External id": 21859,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671586.315, "dur": 0.673, "args": { "External id": 21860,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671588.171, "dur": 0.550, "args": { "External id": 21861,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671590.232, "dur": 0.754, "args": { "External id": 21862,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671591.902, "dur": 0.379, "args": { "External id": 21863,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671592.961, "dur": 0.789, "args": { "External id": 21864,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671594.528, "dur": 0.498, "args": { "External id": 21865,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671595.984, "dur": 0.897, "args": { "External id": 21866,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651671598.151, "dur": 0.178, "args": { "External id": 21867,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651671614.688, "dur": 16.410, "args": { "External id": 21868,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4459 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651671682.059, "dur": 107.981, "args": { "External id": 21869,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4460 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651671708.507, "dur": 78.364, "args": { "External id": 21870,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4461, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651671717.333, "dur": 65.696, "args": { "External id": 21871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4462 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651671805.761, "dur": 2.122, "args": { "External id": 21872,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4463, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651671877.680, "dur": 1651.881, "args": { "External id": 21873,"Sequence number": 246558, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4464 } }, { "ph": "f", "id": 210, "pid": 1336757, "tid": 1381170, "ts": 1295651671877.680, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651671980.696, "dur": 151.992, "args": { "External id": 21874,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4465 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651672174.895, "dur": 38.431, "args": { "External id": 21875,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651672243.206, "dur": 54.592, "args": { "External id": 21876,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651672308.918, "dur": 32.495, "args": { "External id": 21877,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651672347.676, "dur": 44.994, "args": { "External id": 21878,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651672399.715, "dur": 27.324, "args": { "External id": 21879,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651672433.824, "dur": 42.150, "args": { "External id": 21880,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4471 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651672502.011, "dur": 24.154, "args": { "External id": 21881,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4472 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651672546.497, "dur": 29.004, "args": { "External id": 21882,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4473 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651672596.136, "dur": 19.047, "args": { "External id": 21883,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4474 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651672628.759, "dur": 16.699, "args": { "External id": 21884,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651672653.843, "dur": 30.980, "args": { "External id": 21885,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651672687.818, "dur": 33.053, "args": { "External id": 21886,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4477 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651672747.119, "dur": 158.824, "args": { "External id": 21887,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651672817.279, "dur": 6.782, "args": { "External id": 21888,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651672825.777, "dur": 1.940, "args": { "External id": 21889,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4480 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651672937.948, "dur": 23.805, "args": { "External id": 21890,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4481 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651672975.893, "dur": 66.051, "args": { "External id": 21891,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651673053.620, "dur": 49.874, "args": { "External id": 21892,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651673109.180, "dur": 35.270, "args": { "External id": 21893,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651673151.397, "dur": 22.590, "args": { "External id": 21894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651673177.973, "dur": 29.267, "args": { "External id": 21895,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651673213.073, "dur": 35.791, "args": { "External id": 21896,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651673258.201, "dur": 32.491, "args": { "External id": 21897,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4488 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651673312.275, "dur": 25.526, "args": { "External id": 21898,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4489 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651673356.345, "dur": 23.057, "args": { "External id": 21899,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4490 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651673399.962, "dur": 27.239, "args": { "External id": 21900,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4491 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651673453.581, "dur": 15.077, "args": { "External id": 21901,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4492 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651673482.540, "dur": 16.051, "args": { "External id": 21902,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4493 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673570.425, "dur": 18.867, "args": { "External id": 21903,"Record function id": 0, "Ev Idx": 4494 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673574.019, "dur": 14.411, "args": { "External id": 21904,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673581.126, "dur": 6.389, "args": { "External id": 21905,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4496 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673582.838, "dur": 4.526, "args": { "External id": 21906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4497 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673593.040, "dur": 4.939, "args": { "External id": 21907,"Record function id": 0, "Ev Idx": 4498 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673594.685, "dur": 2.846, "args": { "External id": 21908,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673595.398, "dur": 1.644, "args": { "External id": 21909,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4500 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673595.970, "dur": 1.001, "args": { "External id": 21910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4501 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673601.271, "dur": 4.693, "args": { "External id": 21911,"Record function id": 0, "Ev Idx": 4502 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673602.694, "dur": 2.803, "args": { "External id": 21912,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673603.193, "dur": 1.849, "args": { "External id": 21913,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4504 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673604.001, "dur": 0.929, "args": { "External id": 21914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4505 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673609.162, "dur": 3.595, "args": { "External id": 21915,"Record function id": 0, "Ev Idx": 4506 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673610.077, "dur": 2.254, "args": { "External id": 21916,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673610.726, "dur": 1.197, "args": { "External id": 21917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4508 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673611.066, "dur": 0.749, "args": { "External id": 21918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4509 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673615.853, "dur": 4.196, "args": { "External id": 21919,"Record function id": 0, "Ev Idx": 4510 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673616.830, "dur": 2.758, "args": { "External id": 21920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673617.284, "dur": 1.861, "args": { "External id": 21921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4512 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673617.657, "dur": 1.417, "args": { "External id": 21922,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4513 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673623.184, "dur": 3.899, "args": { "External id": 21923,"Record function id": 0, "Ev Idx": 4514 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673624.343, "dur": 2.297, "args": { "External id": 21924,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673624.823, "dur": 1.356, "args": { "External id": 21925,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4516 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673625.422, "dur": 0.691, "args": { "External id": 21926,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4517 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673630.422, "dur": 5.573, "args": { "External id": 21927,"Record function id": 0, "Ev Idx": 4518 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673631.532, "dur": 4.011, "args": { "External id": 21928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673632.155, "dur": 2.977, "args": { "External id": 21929,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4520 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673634.342, "dur": 0.698, "args": { "External id": 21930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4521 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673639.051, "dur": 3.659, "args": { "External id": 21931,"Record function id": 0, "Ev Idx": 4522 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673640.238, "dur": 2.065, "args": { "External id": 21932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673640.697, "dur": 1.198, "args": { "External id": 21933,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4524 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673640.984, "dur": 0.820, "args": { "External id": 21934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4525 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673645.733, "dur": 3.859, "args": { "External id": 21935,"Record function id": 0, "Ev Idx": 4526 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651673646.837, "dur": 2.329, "args": { "External id": 21936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673647.289, "dur": 1.449, "args": { "External id": 21937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4528 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651673647.668, "dur": 0.994, "args": { "External id": 21938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4529 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651673653.300, "dur": 36298.614, "args": { "External id": 21939,"Record function id": 0, "Sequence number": 246557, "Fwd thread id": 1, "Ev Idx": 4530 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651673655.005, "dur": 36288.551, "args": { "External id": 21940,"Sequence number": 246557, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4531 } }, { "ph": "f", "id": 211, "pid": 1336757, "tid": 1381170, "ts": 1295651673655.005, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.8)", "pid": 1336757, "tid": 1381170, "ts": 1295651673682.206, "dur": 35.855, "args": { "External id": 21941,"Record function id": 0, "Ev Idx": 4532 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.8)", "pid": 1336757, "tid": 1381170, "ts": 1295651673726.012, "dur": 58.122, "args": { "External id": 21942,"Record function id": 0, "Ev Idx": 4533 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.8)", "pid": 1336757, "tid": 1381170, "ts": 1295651673790.222, "dur": 36146.342, "args": { "External id": 21943,"Record function id": 0, "Ev Idx": 4534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651673875.978, "dur": 6.689, "args": { "External id": 21944,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651673891.668, "dur": 4.635, "args": { "External id": 21945,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4536 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651673912.306, "dur": 35229.607, "args": { "External id": 21946,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651673925.465, "dur": 35208.517, "args": { "External id": 21947,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651673970.242, "dur": 53.872, "args": { "External id": 21948,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651674031.054, "dur": 35069.793, "args": { "External id": 21949,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651674033.746, "dur": 35066.592, "args": { "External id": 21950,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651674037.895, "dur": 6.144, "args": { "External id": 21951,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651674045.443, "dur": 35051.573, "args": { "External id": 21952,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651709227.417, "dur": 20.770, "args": { "External id": 21953,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651709241.505, "dur": 6.229, "args": { "External id": 21954,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4545 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651709277.586, "dur": 383.070, "args": { "External id": 21955,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4546 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651709305.478, "dur": 350.642, "args": { "External id": 21956,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4547, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651709316.502, "dur": 333.704, "args": { "External id": 21957,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4548 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651709679.948, "dur": 2.251, "args": { "External id": 21958,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4549, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709739.215, "dur": 6.455, "args": { "External id": 21959,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709789.085, "dur": 1.229, "args": { "External id": 21960,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709805.359, "dur": 1.711, "args": { "External id": 21961,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709819.515, "dur": 0.936, "args": { "External id": 21962,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709835.644, "dur": 1.113, "args": { "External id": 21963,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709846.955, "dur": 1.580, "args": { "External id": 21964,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709859.104, "dur": 0.706, "args": { "External id": 21965,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709870.608, "dur": 0.940, "args": { "External id": 21966,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651709879.938, "dur": 1.190, "args": { "External id": 21967,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4558 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651709964.923, "dur": 2656.162, "args": { "External id": 21968,"Record function id": 0, "Ev Idx": 4559 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.7)", "pid": 1336757, "tid": 1381170, "ts": 1295651710032.184, "dur": 941.042, "args": { "External id": 21969,"Record function id": 0, "Ev Idx": 4560 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 1336757, "tid": 1381170, "ts": 1295651710046.691, "dur": 321.826, "args": { "External id": 21970,"Record function id": 0, "Ev Idx": 4561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710125.598, "dur": 4.733, "args": { "External id": 21971,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710134.999, "dur": 1.456, "args": { "External id": 21972,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710138.267, "dur": 0.872, "args": { "External id": 21973,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710140.619, "dur": 1.247, "args": { "External id": 21974,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710143.312, "dur": 1.196, "args": { "External id": 21975,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710147.654, "dur": 1.384, "args": { "External id": 21976,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710150.519, "dur": 0.893, "args": { "External id": 21977,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710152.573, "dur": 1.190, "args": { "External id": 21978,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710154.931, "dur": 0.637, "args": { "External id": 21979,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651710158.078, "dur": 1.067, "args": { "External id": 21980,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4571 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651710175.630, "dur": 160.125, "args": { "External id": 21981,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651710191.283, "dur": 139.875, "args": { "External id": 21982,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651710206.633, "dur": 13.762, "args": { "External id": 21983,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651710223.503, "dur": 80.191, "args": { "External id": 21984,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651710226.241, "dur": 77.153, "args": { "External id": 21985,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710244.739, "dur": 6.224, "args": { "External id": 21986,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651710252.943, "dur": 49.709, "args": { "External id": 21987,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4578 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.6", "pid": 1336757, "tid": 1381170, "ts": 1295651710449.741, "dur": 515.821, "args": { "External id": 21988,"Record function id": 0, "Ev Idx": 4579 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 1336757, "tid": 1381170, "ts": 1295651710465.390, "dur": 488.812, "args": { "External id": 21989,"Record function id": 0, "Ev Idx": 4580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651710519.604, "dur": 5.283, "args": { "External id": 21990,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651710539.920, "dur": 23.640, "args": { "External id": 21991,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710544.706, "dur": 2.095, "args": { "External id": 21992,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710548.725, "dur": 0.311, "args": { "External id": 21993,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710550.362, "dur": 0.275, "args": { "External id": 21994,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710551.797, "dur": 0.411, "args": { "External id": 21995,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710554.328, "dur": 0.380, "args": { "External id": 21996,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710555.505, "dur": 0.184, "args": { "External id": 21997,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710556.734, "dur": 0.758, "args": { "External id": 21998,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710558.735, "dur": 0.375, "args": { "External id": 21999,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710559.690, "dur": 0.173, "args": { "External id": 22000,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651710572.534, "dur": 27.001, "args": { "External id": 22001,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4592 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651710628.198, "dur": 111.475, "args": { "External id": 22002,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651710637.812, "dur": 2.965, "args": { "External id": 22003,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651710645.350, "dur": 10.701, "args": { "External id": 22004,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651710649.440, "dur": 6.207, "args": { "External id": 22005,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710653.300, "dur": 0.610, "args": { "External id": 22006,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651710662.209, "dur": 21.069, "args": { "External id": 22007,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710664.407, "dur": 0.878, "args": { "External id": 22008,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710666.425, "dur": 0.711, "args": { "External id": 22009,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710668.236, "dur": 0.531, "args": { "External id": 22010,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710670.220, "dur": 0.416, "args": { "External id": 22011,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710671.705, "dur": 0.300, "args": { "External id": 22012,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710673.356, "dur": 0.589, "args": { "External id": 22013,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710674.973, "dur": 0.296, "args": { "External id": 22014,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710676.029, "dur": 0.398, "args": { "External id": 22015,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651710677.353, "dur": 0.841, "args": { "External id": 22016,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651710715.563, "dur": 16.891, "args": { "External id": 22017,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4608 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651710782.626, "dur": 108.068, "args": { "External id": 22018,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4609 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651710809.111, "dur": 78.422, "args": { "External id": 22019,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4610, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651710817.900, "dur": 65.792, "args": { "External id": 22020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4611 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651710907.685, "dur": 1.921, "args": { "External id": 22021,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4612, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651710979.807, "dur": 1621.814, "args": { "External id": 22022,"Sequence number": 246556, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4613 } }, { "ph": "f", "id": 212, "pid": 1336757, "tid": 1381170, "ts": 1295651710979.807, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651711140.451, "dur": 119.578, "args": { "External id": 22023,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4614 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651711301.655, "dur": 40.614, "args": { "External id": 22024,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651711358.132, "dur": 51.446, "args": { "External id": 22025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651711419.333, "dur": 32.770, "args": { "External id": 22026,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651711462.590, "dur": 45.108, "args": { "External id": 22027,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651711514.682, "dur": 27.591, "args": { "External id": 22028,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651711548.357, "dur": 43.073, "args": { "External id": 22029,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4620 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651711616.766, "dur": 21.581, "args": { "External id": 22030,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4621 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651711655.352, "dur": 28.593, "args": { "External id": 22031,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4622 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651711705.697, "dur": 19.815, "args": { "External id": 22032,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4623 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651711737.970, "dur": 15.652, "args": { "External id": 22033,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651711761.092, "dur": 30.093, "args": { "External id": 22034,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651711794.263, "dur": 31.639, "args": { "External id": 22035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4626 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651711851.242, "dur": 197.053, "args": { "External id": 22036,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651711921.585, "dur": 5.770, "args": { "External id": 22037,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651711929.121, "dur": 1.972, "args": { "External id": 22038,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4629 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651712084.962, "dur": 26.099, "args": { "External id": 22039,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4630 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651712124.429, "dur": 15.110, "args": { "External id": 22040,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651712147.778, "dur": 40.286, "args": { "External id": 22041,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651712194.056, "dur": 33.618, "args": { "External id": 22042,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651712249.646, "dur": 25.985, "args": { "External id": 22043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651712280.057, "dur": 29.907, "args": { "External id": 22044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651712315.050, "dur": 21.304, "args": { "External id": 22045,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651712342.635, "dur": 28.891, "args": { "External id": 22046,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4637 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651712391.230, "dur": 22.950, "args": { "External id": 22047,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4638 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651712432.247, "dur": 22.927, "args": { "External id": 22048,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4639 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651712478.980, "dur": 26.215, "args": { "External id": 22049,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4640 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651712524.959, "dur": 15.162, "args": { "External id": 22050,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4641 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651712555.754, "dur": 15.945, "args": { "External id": 22051,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4642 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712645.574, "dur": 14.486, "args": { "External id": 22052,"Record function id": 0, "Ev Idx": 4643 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712648.436, "dur": 10.774, "args": { "External id": 22053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712652.337, "dur": 5.952, "args": { "External id": 22054,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4645 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712653.930, "dur": 4.258, "args": { "External id": 22055,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4646 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712664.035, "dur": 5.107, "args": { "External id": 22056,"Record function id": 0, "Ev Idx": 4647 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712665.409, "dur": 3.249, "args": { "External id": 22057,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712666.364, "dur": 1.833, "args": { "External id": 22058,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4649 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712667.338, "dur": 0.788, "args": { "External id": 22059,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4650 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712672.469, "dur": 4.341, "args": { "External id": 22060,"Record function id": 0, "Ev Idx": 4651 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712673.709, "dur": 2.632, "args": { "External id": 22061,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712674.392, "dur": 1.497, "args": { "External id": 22062,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4653 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712674.917, "dur": 0.886, "args": { "External id": 22063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4654 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712680.051, "dur": 3.734, "args": { "External id": 22064,"Record function id": 0, "Ev Idx": 4655 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712681.249, "dur": 2.105, "args": { "External id": 22065,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712681.816, "dur": 1.091, "args": { "External id": 22066,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4657 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712682.170, "dur": 0.648, "args": { "External id": 22067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4658 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712687.079, "dur": 3.271, "args": { "External id": 22068,"Record function id": 0, "Ev Idx": 4659 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712688.150, "dur": 1.770, "args": { "External id": 22069,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712688.669, "dur": 0.824, "args": { "External id": 22070,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4661 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712688.964, "dur": 0.465, "args": { "External id": 22071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4662 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712693.483, "dur": 4.365, "args": { "External id": 22072,"Record function id": 0, "Ev Idx": 4663 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712694.708, "dur": 2.737, "args": { "External id": 22073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712695.356, "dur": 1.658, "args": { "External id": 22074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4665 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712696.032, "dur": 0.909, "args": { "External id": 22075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4666 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712701.042, "dur": 3.614, "args": { "External id": 22076,"Record function id": 0, "Ev Idx": 4667 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712702.004, "dur": 2.238, "args": { "External id": 22077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712702.689, "dur": 1.102, "args": { "External id": 22078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4669 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712703.267, "dur": 0.458, "args": { "External id": 22079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4670 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712707.869, "dur": 3.897, "args": { "External id": 22080,"Record function id": 0, "Ev Idx": 4671 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712708.861, "dur": 2.506, "args": { "External id": 22081,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712709.729, "dur": 1.243, "args": { "External id": 22082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4673 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712710.011, "dur": 0.894, "args": { "External id": 22083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4674 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712714.818, "dur": 4.935, "args": { "External id": 22084,"Record function id": 0, "Ev Idx": 4675 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651712716.052, "dur": 3.266, "args": { "External id": 22085,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712716.527, "dur": 2.370, "args": { "External id": 22086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4677 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651712718.335, "dur": 0.469, "args": { "External id": 22087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4678 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651712723.378, "dur": 36570.744, "args": { "External id": 22088,"Record function id": 0, "Sequence number": 246555, "Fwd thread id": 1, "Ev Idx": 4679 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651712724.646, "dur": 36560.476, "args": { "External id": 22089,"Sequence number": 246555, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4680 } }, { "ph": "f", "id": 213, "pid": 1336757, "tid": 1381170, "ts": 1295651712724.646, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.7)", "pid": 1336757, "tid": 1381170, "ts": 1295651712751.395, "dur": 34.233, "args": { "External id": 22090,"Record function id": 0, "Ev Idx": 4681 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.7)", "pid": 1336757, "tid": 1381170, "ts": 1295651712792.982, "dur": 58.193, "args": { "External id": 22091,"Record function id": 0, "Ev Idx": 4682 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.7)", "pid": 1336757, "tid": 1381170, "ts": 1295651712856.987, "dur": 36419.874, "args": { "External id": 22092,"Record function id": 0, "Ev Idx": 4683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651712940.284, "dur": 6.622, "args": { "External id": 22093,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651712955.869, "dur": 4.837, "args": { "External id": 22094,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4685 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651712974.209, "dur": 35522.888, "args": { "External id": 22095,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651713025.735, "dur": 35462.750, "args": { "External id": 22096,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651713070.208, "dur": 15.095, "args": { "External id": 22097,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651713091.494, "dur": 35357.875, "args": { "External id": 22098,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651713093.646, "dur": 35355.163, "args": { "External id": 22099,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651713097.850, "dur": 6.392, "args": { "External id": 22100,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651713107.304, "dur": 35338.243, "args": { "External id": 22101,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651748582.952, "dur": 9.287, "args": { "External id": 22102,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651748585.542, "dur": 6.338, "args": { "External id": 22103,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4694 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651748620.648, "dur": 339.132, "args": { "External id": 22104,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4695 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651748649.147, "dur": 306.150, "args": { "External id": 22105,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4696, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651748659.378, "dur": 291.027, "args": { "External id": 22106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4697 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651748976.409, "dur": 2.522, "args": { "External id": 22107,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4698, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749068.451, "dur": 6.434, "args": { "External id": 22108,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749118.443, "dur": 1.500, "args": { "External id": 22109,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749135.048, "dur": 1.367, "args": { "External id": 22110,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749147.681, "dur": 0.901, "args": { "External id": 22111,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749159.270, "dur": 0.817, "args": { "External id": 22112,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749170.076, "dur": 1.324, "args": { "External id": 22113,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749183.235, "dur": 0.880, "args": { "External id": 22114,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749193.788, "dur": 1.024, "args": { "External id": 22115,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749204.391, "dur": 0.687, "args": { "External id": 22116,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4707 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651749309.787, "dur": 2548.094, "args": { "External id": 22117,"Record function id": 0, "Ev Idx": 4708 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.6)", "pid": 1336757, "tid": 1381170, "ts": 1295651749328.063, "dur": 953.390, "args": { "External id": 22118,"Record function id": 0, "Ev Idx": 4709 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 1336757, "tid": 1381170, "ts": 1295651749341.166, "dur": 295.384, "args": { "External id": 22119,"Record function id": 0, "Ev Idx": 4710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749415.728, "dur": 4.852, "args": { "External id": 22120,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749423.759, "dur": 1.527, "args": { "External id": 22121,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749428.714, "dur": 0.903, "args": { "External id": 22122,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749430.958, "dur": 1.400, "args": { "External id": 22123,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749433.702, "dur": 0.865, "args": { "External id": 22124,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749435.832, "dur": 1.298, "args": { "External id": 22125,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749440.595, "dur": 0.869, "args": { "External id": 22126,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749442.651, "dur": 0.816, "args": { "External id": 22127,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749444.973, "dur": 0.538, "args": { "External id": 22128,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651749446.894, "dur": 1.093, "args": { "External id": 22129,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4720 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651749465.781, "dur": 143.892, "args": { "External id": 22130,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651749480.809, "dur": 124.336, "args": { "External id": 22131,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651749495.749, "dur": 11.575, "args": { "External id": 22132,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651749510.350, "dur": 65.054, "args": { "External id": 22133,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651749512.800, "dur": 62.217, "args": { "External id": 22134,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749518.747, "dur": 4.664, "args": { "External id": 22135,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651749525.566, "dur": 48.870, "args": { "External id": 22136,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4727 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.5", "pid": 1336757, "tid": 1381170, "ts": 1295651749711.101, "dur": 562.251, "args": { "External id": 22137,"Record function id": 0, "Ev Idx": 4728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 1336757, "tid": 1381170, "ts": 1295651749725.659, "dur": 534.619, "args": { "External id": 22138,"Record function id": 0, "Ev Idx": 4729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651749777.527, "dur": 4.520, "args": { "External id": 22139,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651749797.063, "dur": 21.527, "args": { "External id": 22140,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749801.444, "dur": 1.631, "args": { "External id": 22141,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749804.576, "dur": 0.302, "args": { "External id": 22142,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749806.058, "dur": 0.472, "args": { "External id": 22143,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749807.791, "dur": 0.406, "args": { "External id": 22144,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749809.777, "dur": 0.400, "args": { "External id": 22145,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749811.205, "dur": 0.232, "args": { "External id": 22146,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749812.378, "dur": 0.282, "args": { "External id": 22147,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749814.438, "dur": 0.309, "args": { "External id": 22148,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749815.378, "dur": 0.198, "args": { "External id": 22149,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651749828.071, "dur": 26.907, "args": { "External id": 22150,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4741 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651749881.815, "dur": 93.212, "args": { "External id": 22151,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651749890.266, "dur": 3.013, "args": { "External id": 22152,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651749897.959, "dur": 9.619, "args": { "External id": 22153,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651749902.104, "dur": 5.086, "args": { "External id": 22154,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749905.292, "dur": 0.681, "args": { "External id": 22155,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651749913.669, "dur": 22.337, "args": { "External id": 22156,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749915.371, "dur": 0.366, "args": { "External id": 22157,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749916.826, "dur": 0.607, "args": { "External id": 22158,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749921.319, "dur": 0.265, "args": { "External id": 22159,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749922.795, "dur": 0.305, "args": { "External id": 22160,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749924.346, "dur": 0.709, "args": { "External id": 22161,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749926.233, "dur": 0.466, "args": { "External id": 22162,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749927.279, "dur": 0.220, "args": { "External id": 22163,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749928.544, "dur": 0.554, "args": { "External id": 22164,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651749930.493, "dur": 0.292, "args": { "External id": 22165,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651749949.895, "dur": 18.068, "args": { "External id": 22166,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4757 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651750071.282, "dur": 107.941, "args": { "External id": 22167,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4758 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651750096.272, "dur": 79.638, "args": { "External id": 22168,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4759, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651750106.180, "dur": 65.703, "args": { "External id": 22169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4760 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651750192.696, "dur": 1.669, "args": { "External id": 22170,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4761, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651750289.430, "dur": 1544.445, "args": { "External id": 22171,"Sequence number": 246554, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4762 } }, { "ph": "f", "id": 214, "pid": 1336757, "tid": 1381170, "ts": 1295651750289.430, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651750395.508, "dur": 104.139, "args": { "External id": 22172,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4763 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651750534.769, "dur": 40.847, "args": { "External id": 22173,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651750590.910, "dur": 47.547, "args": { "External id": 22174,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651750648.230, "dur": 32.991, "args": { "External id": 22175,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651750687.965, "dur": 45.283, "args": { "External id": 22176,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651750739.957, "dur": 27.513, "args": { "External id": 22177,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651750774.077, "dur": 40.983, "args": { "External id": 22178,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4769 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651750836.291, "dur": 23.495, "args": { "External id": 22179,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4770 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651750876.798, "dur": 27.301, "args": { "External id": 22180,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4771 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651750923.127, "dur": 20.156, "args": { "External id": 22181,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4772 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651750956.872, "dur": 16.126, "args": { "External id": 22182,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651750981.043, "dur": 74.083, "args": { "External id": 22183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651751060.662, "dur": 36.809, "args": { "External id": 22184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4775 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651751128.104, "dur": 184.983, "args": { "External id": 22185,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651751206.590, "dur": 6.715, "args": { "External id": 22186,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651751215.120, "dur": 1.856, "args": { "External id": 22187,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4778 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651751346.402, "dur": 24.564, "args": { "External id": 22188,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4779 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651751382.308, "dur": 14.481, "args": { "External id": 22189,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651751404.651, "dur": 39.061, "args": { "External id": 22190,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651751449.646, "dur": 34.942, "args": { "External id": 22191,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651751491.023, "dur": 21.759, "args": { "External id": 22192,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651751517.476, "dur": 28.753, "args": { "External id": 22193,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651751551.441, "dur": 21.481, "args": { "External id": 22194,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651751578.407, "dur": 30.078, "args": { "External id": 22195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4786 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651751626.734, "dur": 23.798, "args": { "External id": 22196,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4787 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651751666.948, "dur": 23.559, "args": { "External id": 22197,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4788 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651751705.462, "dur": 17.426, "args": { "External id": 22198,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4789 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651751752.241, "dur": 22.145, "args": { "External id": 22199,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4790 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651751789.804, "dur": 17.347, "args": { "External id": 22200,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4791 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751878.908, "dur": 14.818, "args": { "External id": 22201,"Record function id": 0, "Ev Idx": 4792 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751882.168, "dur": 10.598, "args": { "External id": 22202,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751886.056, "dur": 5.826, "args": { "External id": 22203,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4794 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751887.242, "dur": 4.477, "args": { "External id": 22204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4795 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751897.746, "dur": 4.539, "args": { "External id": 22205,"Record function id": 0, "Ev Idx": 4796 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751899.227, "dur": 2.551, "args": { "External id": 22206,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751900.059, "dur": 1.230, "args": { "External id": 22207,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4798 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751900.459, "dur": 0.726, "args": { "External id": 22208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4799 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751905.695, "dur": 4.571, "args": { "External id": 22209,"Record function id": 0, "Ev Idx": 4800 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751907.086, "dur": 2.745, "args": { "External id": 22210,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751907.920, "dur": 1.452, "args": { "External id": 22211,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4802 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751908.592, "dur": 0.697, "args": { "External id": 22212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4803 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751916.929, "dur": 3.855, "args": { "External id": 22213,"Record function id": 0, "Ev Idx": 4804 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751918.050, "dur": 2.298, "args": { "External id": 22214,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751918.861, "dur": 1.068, "args": { "External id": 22215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4806 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751919.373, "dur": 0.482, "args": { "External id": 22216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4807 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751923.871, "dur": 3.525, "args": { "External id": 22217,"Record function id": 0, "Ev Idx": 4808 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751924.925, "dur": 2.057, "args": { "External id": 22218,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751925.485, "dur": 1.052, "args": { "External id": 22219,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4810 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751925.889, "dur": 0.582, "args": { "External id": 22220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4811 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751930.509, "dur": 3.565, "args": { "External id": 22221,"Record function id": 0, "Ev Idx": 4812 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751931.457, "dur": 2.212, "args": { "External id": 22222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751932.062, "dur": 1.206, "args": { "External id": 22223,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4814 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751932.394, "dur": 0.811, "args": { "External id": 22224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4815 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751937.252, "dur": 5.395, "args": { "External id": 22225,"Record function id": 0, "Ev Idx": 4816 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751938.456, "dur": 3.778, "args": { "External id": 22226,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751938.955, "dur": 2.882, "args": { "External id": 22227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4818 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751940.637, "dur": 1.099, "args": { "External id": 22228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4819 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751945.789, "dur": 3.601, "args": { "External id": 22229,"Record function id": 0, "Ev Idx": 4820 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751946.947, "dur": 2.005, "args": { "External id": 22230,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751947.434, "dur": 1.121, "args": { "External id": 22231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4822 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751947.718, "dur": 0.744, "args": { "External id": 22232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4823 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751952.499, "dur": 3.790, "args": { "External id": 22233,"Record function id": 0, "Ev Idx": 4824 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651751953.706, "dur": 2.176, "args": { "External id": 22234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751954.414, "dur": 1.070, "args": { "External id": 22235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4826 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651751954.687, "dur": 0.730, "args": { "External id": 22236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4827 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651751959.783, "dur": 37482.933, "args": { "External id": 22237,"Record function id": 0, "Sequence number": 246553, "Fwd thread id": 1, "Ev Idx": 4828 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651751960.894, "dur": 37473.517, "args": { "External id": 22238,"Sequence number": 246553, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4829 } }, { "ph": "f", "id": 215, "pid": 1336757, "tid": 1381170, "ts": 1295651751960.894, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.6)", "pid": 1336757, "tid": 1381170, "ts": 1295651752023.845, "dur": 38.265, "args": { "External id": 22239,"Record function id": 0, "Ev Idx": 4830 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.6)", "pid": 1336757, "tid": 1381170, "ts": 1295651752069.880, "dur": 57.787, "args": { "External id": 22240,"Record function id": 0, "Ev Idx": 4831 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.6)", "pid": 1336757, "tid": 1381170, "ts": 1295651752133.574, "dur": 37292.617, "args": { "External id": 22241,"Record function id": 0, "Ev Idx": 4832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651752219.214, "dur": 7.311, "args": { "External id": 22242,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651752251.163, "dur": 5.213, "args": { "External id": 22243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4834 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651752273.557, "dur": 36359.672, "args": { "External id": 22244,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651752286.760, "dur": 36338.107, "args": { "External id": 22245,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651752332.457, "dur": 14.734, "args": { "External id": 22246,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651752353.124, "dur": 36231.521, "args": { "External id": 22247,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651752355.588, "dur": 36228.378, "args": { "External id": 22248,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651752359.749, "dur": 6.084, "args": { "External id": 22249,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651752367.513, "dur": 36212.887, "args": { "External id": 22250,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651788719.733, "dur": 9.474, "args": { "External id": 22251,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651788722.710, "dur": 6.186, "args": { "External id": 22252,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4843 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651788755.189, "dur": 376.552, "args": { "External id": 22253,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4844 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651788784.304, "dur": 342.665, "args": { "External id": 22254,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4845, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651788794.762, "dur": 326.693, "args": { "External id": 22255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4846 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651789153.340, "dur": 2.260, "args": { "External id": 22256,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4847, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789211.200, "dur": 6.551, "args": { "External id": 22257,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789274.969, "dur": 2.096, "args": { "External id": 22258,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789293.507, "dur": 1.896, "args": { "External id": 22259,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789306.492, "dur": 0.981, "args": { "External id": 22260,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789318.586, "dur": 0.985, "args": { "External id": 22261,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789329.236, "dur": 1.011, "args": { "External id": 22262,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789340.507, "dur": 0.718, "args": { "External id": 22263,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789352.722, "dur": 1.743, "args": { "External id": 22264,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789366.015, "dur": 1.024, "args": { "External id": 22265,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4856 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651789457.136, "dur": 2492.975, "args": { "External id": 22266,"Record function id": 0, "Ev Idx": 4857 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.5)", "pid": 1336757, "tid": 1381170, "ts": 1295651789475.608, "dur": 952.462, "args": { "External id": 22267,"Record function id": 0, "Ev Idx": 4858 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 1336757, "tid": 1381170, "ts": 1295651789488.950, "dur": 292.948, "args": { "External id": 22268,"Record function id": 0, "Ev Idx": 4859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789565.235, "dur": 4.468, "args": { "External id": 22269,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789572.967, "dur": 1.402, "args": { "External id": 22270,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789576.248, "dur": 1.074, "args": { "External id": 22271,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789578.709, "dur": 0.811, "args": { "External id": 22272,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789582.069, "dur": 1.558, "args": { "External id": 22273,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789584.836, "dur": 0.863, "args": { "External id": 22274,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789587.187, "dur": 0.888, "args": { "External id": 22275,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789589.229, "dur": 1.396, "args": { "External id": 22276,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789593.113, "dur": 1.036, "args": { "External id": 22277,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651789595.582, "dur": 1.520, "args": { "External id": 22278,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4869 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651789614.160, "dur": 141.044, "args": { "External id": 22279,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651789628.669, "dur": 122.461, "args": { "External id": 22280,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651789643.738, "dur": 12.284, "args": { "External id": 22281,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651789658.988, "dur": 64.137, "args": { "External id": 22282,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651789661.591, "dur": 61.230, "args": { "External id": 22283,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789665.370, "dur": 5.564, "args": { "External id": 22284,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651789672.553, "dur": 49.674, "args": { "External id": 22285,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4876 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.4", "pid": 1336757, "tid": 1381170, "ts": 1295651789857.043, "dur": 563.452, "args": { "External id": 22286,"Record function id": 0, "Ev Idx": 4877 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 1336757, "tid": 1381170, "ts": 1295651789870.690, "dur": 537.415, "args": { "External id": 22287,"Record function id": 0, "Ev Idx": 4878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651789923.707, "dur": 4.738, "args": { "External id": 22288,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651789943.818, "dur": 21.869, "args": { "External id": 22289,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789947.755, "dur": 1.643, "args": { "External id": 22290,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789951.047, "dur": 0.261, "args": { "External id": 22291,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789953.227, "dur": 0.368, "args": { "External id": 22292,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789955.053, "dur": 0.351, "args": { "External id": 22293,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789956.051, "dur": 0.195, "args": { "External id": 22294,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789957.451, "dur": 0.728, "args": { "External id": 22295,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789959.166, "dur": 0.501, "args": { "External id": 22296,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789960.539, "dur": 0.362, "args": { "External id": 22297,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651789961.855, "dur": 0.910, "args": { "External id": 22298,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651789975.350, "dur": 70.341, "args": { "External id": 22299,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4890 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651790079.027, "dur": 90.884, "args": { "External id": 22300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651790089.559, "dur": 4.320, "args": { "External id": 22301,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651790099.122, "dur": 10.369, "args": { "External id": 22302,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651790103.341, "dur": 5.733, "args": { "External id": 22303,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790106.650, "dur": 0.725, "args": { "External id": 22304,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651790116.292, "dur": 19.795, "args": { "External id": 22305,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790117.669, "dur": 0.925, "args": { "External id": 22306,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790120.039, "dur": 0.461, "args": { "External id": 22307,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790121.450, "dur": 0.480, "args": { "External id": 22308,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790122.732, "dur": 0.551, "args": { "External id": 22309,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790124.339, "dur": 0.479, "args": { "External id": 22310,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790125.585, "dur": 0.407, "args": { "External id": 22311,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790126.967, "dur": 0.634, "args": { "External id": 22312,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790129.018, "dur": 0.334, "args": { "External id": 22313,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651790129.919, "dur": 0.728, "args": { "External id": 22314,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651790144.594, "dur": 17.975, "args": { "External id": 22315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4906 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651790213.657, "dur": 125.156, "args": { "External id": 22316,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4907 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651790252.286, "dur": 82.903, "args": { "External id": 22317,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4908, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651790262.380, "dur": 69.115, "args": { "External id": 22318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4909 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651790356.165, "dur": 1.787, "args": { "External id": 22319,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4910, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651790434.448, "dur": 1496.913, "args": { "External id": 22320,"Sequence number": 246552, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4911 } }, { "ph": "f", "id": 216, "pid": 1336757, "tid": 1381170, "ts": 1295651790434.448, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651790540.941, "dur": 99.761, "args": { "External id": 22321,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4912 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651790677.406, "dur": 38.206, "args": { "External id": 22322,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651790729.847, "dur": 45.975, "args": { "External id": 22323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651790784.723, "dur": 32.204, "args": { "External id": 22324,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651790823.000, "dur": 45.066, "args": { "External id": 22325,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651790874.552, "dur": 27.038, "args": { "External id": 22326,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651790908.549, "dur": 41.619, "args": { "External id": 22327,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4918 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651790972.424, "dur": 63.407, "args": { "External id": 22328,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4919 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651791055.899, "dur": 29.808, "args": { "External id": 22329,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4920 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651791108.265, "dur": 20.446, "args": { "External id": 22330,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4921 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651791141.160, "dur": 15.773, "args": { "External id": 22331,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791164.910, "dur": 33.901, "args": { "External id": 22332,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791202.053, "dur": 48.871, "args": { "External id": 22333,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4924 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651791279.592, "dur": 163.519, "args": { "External id": 22334,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651791353.387, "dur": 5.908, "args": { "External id": 22335,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651791361.106, "dur": 1.930, "args": { "External id": 22336,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4927 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651791476.113, "dur": 24.755, "args": { "External id": 22337,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4928 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651791514.725, "dur": 15.474, "args": { "External id": 22338,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791537.891, "dur": 38.434, "args": { "External id": 22339,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791581.506, "dur": 34.089, "args": { "External id": 22340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791621.627, "dur": 21.416, "args": { "External id": 22341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791647.466, "dur": 29.592, "args": { "External id": 22342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791681.861, "dur": 20.894, "args": { "External id": 22343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651791708.542, "dur": 28.636, "args": { "External id": 22344,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4935 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651791753.447, "dur": 23.340, "args": { "External id": 22345,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4936 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651791795.101, "dur": 24.627, "args": { "External id": 22346,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4937 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651791833.693, "dur": 17.918, "args": { "External id": 22347,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4938 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651791865.479, "dur": 14.687, "args": { "External id": 22348,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4939 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651791890.963, "dur": 15.535, "args": { "External id": 22349,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4940 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651791981.036, "dur": 57.433, "args": { "External id": 22350,"Record function id": 0, "Ev Idx": 4941 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792022.290, "dur": 14.315, "args": { "External id": 22351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792026.947, "dur": 7.107, "args": { "External id": 22352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4943 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792028.524, "dur": 5.073, "args": { "External id": 22353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4944 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792045.946, "dur": 5.140, "args": { "External id": 22354,"Record function id": 0, "Ev Idx": 4945 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792047.793, "dur": 2.903, "args": { "External id": 22355,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792048.623, "dur": 1.541, "args": { "External id": 22356,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4947 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792049.293, "dur": 0.800, "args": { "External id": 22357,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4948 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792054.345, "dur": 4.171, "args": { "External id": 22358,"Record function id": 0, "Ev Idx": 4949 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792055.676, "dur": 2.362, "args": { "External id": 22359,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792056.196, "dur": 1.363, "args": { "External id": 22360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4951 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792056.983, "dur": 0.462, "args": { "External id": 22361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4952 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792061.720, "dur": 3.302, "args": { "External id": 22362,"Record function id": 0, "Ev Idx": 4953 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792062.809, "dur": 1.801, "args": { "External id": 22363,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792063.331, "dur": 0.862, "args": { "External id": 22364,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4955 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792063.616, "dur": 0.485, "args": { "External id": 22365,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4956 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792068.151, "dur": 3.757, "args": { "External id": 22366,"Record function id": 0, "Ev Idx": 4957 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792069.197, "dur": 2.286, "args": { "External id": 22367,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792069.700, "dur": 1.322, "args": { "External id": 22368,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4959 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792069.965, "dur": 0.990, "args": { "External id": 22369,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4960 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792075.105, "dur": 4.216, "args": { "External id": 22370,"Record function id": 0, "Ev Idx": 4961 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792076.340, "dur": 2.541, "args": { "External id": 22371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792077.133, "dur": 1.335, "args": { "External id": 22372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4963 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792077.675, "dur": 0.728, "args": { "External id": 22373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4964 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792082.641, "dur": 5.173, "args": { "External id": 22374,"Record function id": 0, "Ev Idx": 4965 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792083.864, "dur": 3.541, "args": { "External id": 22375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792084.473, "dur": 2.531, "args": { "External id": 22376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4967 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792085.939, "dur": 0.975, "args": { "External id": 22377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4968 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792090.942, "dur": 3.490, "args": { "External id": 22378,"Record function id": 0, "Ev Idx": 4969 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792092.001, "dur": 1.987, "args": { "External id": 22379,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792092.461, "dur": 1.125, "args": { "External id": 22380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4971 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792093.063, "dur": 0.457, "args": { "External id": 22381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4972 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792097.471, "dur": 2.985, "args": { "External id": 22382,"Record function id": 0, "Ev Idx": 4973 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651792098.328, "dur": 1.723, "args": { "External id": 22383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792098.849, "dur": 0.768, "args": { "External id": 22384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4975 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651792099.122, "dur": 0.427, "args": { "External id": 22385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4976 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651792104.041, "dur": 38153.431, "args": { "External id": 22386,"Record function id": 0, "Sequence number": 246551, "Fwd thread id": 1, "Ev Idx": 4977 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651792105.240, "dur": 38141.904, "args": { "External id": 22387,"Sequence number": 246551, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4978 } }, { "ph": "f", "id": 217, "pid": 1336757, "tid": 1381170, "ts": 1295651792105.240, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.5)", "pid": 1336757, "tid": 1381170, "ts": 1295651792140.449, "dur": 37.258, "args": { "External id": 22388,"Record function id": 0, "Ev Idx": 4979 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.5)", "pid": 1336757, "tid": 1381170, "ts": 1295651792185.169, "dur": 82.506, "args": { "External id": 22389,"Record function id": 0, "Ev Idx": 4980 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.5)", "pid": 1336757, "tid": 1381170, "ts": 1295651792274.965, "dur": 37950.060, "args": { "External id": 22390,"Record function id": 0, "Ev Idx": 4981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651792365.123, "dur": 7.202, "args": { "External id": 22391,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651792382.211, "dur": 4.780, "args": { "External id": 22392,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4983 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651792405.283, "dur": 36993.126, "args": { "External id": 22393,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651792418.036, "dur": 36971.357, "args": { "External id": 22394,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651792464.893, "dur": 14.317, "args": { "External id": 22395,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651792484.943, "dur": 36866.021, "args": { "External id": 22396,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651792487.492, "dur": 36862.784, "args": { "External id": 22397,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651792490.888, "dur": 4.953, "args": { "External id": 22398,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651792497.344, "dur": 36848.753, "args": { "External id": 22399,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651829490.127, "dur": 9.859, "args": { "External id": 22400,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651829493.047, "dur": 6.588, "args": { "External id": 22401,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4992 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651829527.352, "dur": 379.854, "args": { "External id": 22402,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4993 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651829554.712, "dur": 348.058, "args": { "External id": 22403,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4994, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651829565.395, "dur": 332.293, "args": { "External id": 22404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4995 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651829927.012, "dur": 2.331, "args": { "External id": 22405,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4996, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830027.383, "dur": 7.173, "args": { "External id": 22406,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830080.803, "dur": 1.770, "args": { "External id": 22407,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830097.994, "dur": 1.377, "args": { "External id": 22408,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830110.697, "dur": 1.000, "args": { "External id": 22409,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830123.338, "dur": 0.937, "args": { "External id": 22410,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830134.164, "dur": 0.997, "args": { "External id": 22411,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830144.396, "dur": 0.826, "args": { "External id": 22412,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830154.727, "dur": 1.449, "args": { "External id": 22413,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830164.819, "dur": 1.147, "args": { "External id": 22414,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5005 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651830273.310, "dur": 2470.759, "args": { "External id": 22415,"Record function id": 0, "Ev Idx": 5006 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.4)", "pid": 1336757, "tid": 1381170, "ts": 1295651830293.295, "dur": 904.762, "args": { "External id": 22416,"Record function id": 0, "Ev Idx": 5007 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 1336757, "tid": 1381170, "ts": 1295651830305.906, "dur": 289.205, "args": { "External id": 22417,"Record function id": 0, "Ev Idx": 5008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830379.815, "dur": 4.705, "args": { "External id": 22418,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830389.127, "dur": 1.122, "args": { "External id": 22419,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830392.037, "dur": 1.274, "args": { "External id": 22420,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830394.781, "dur": 1.136, "args": { "External id": 22421,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830397.373, "dur": 0.878, "args": { "External id": 22422,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830400.772, "dur": 1.303, "args": { "External id": 22423,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830403.546, "dur": 0.774, "args": { "External id": 22424,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830405.485, "dur": 1.210, "args": { "External id": 22425,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830408.248, "dur": 1.229, "args": { "External id": 22426,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651830411.846, "dur": 0.972, "args": { "External id": 22427,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5018 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651830429.184, "dur": 139.147, "args": { "External id": 22428,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651830444.428, "dur": 119.519, "args": { "External id": 22429,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651830459.226, "dur": 12.228, "args": { "External id": 22430,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651830474.561, "dur": 61.466, "args": { "External id": 22431,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651830477.031, "dur": 58.710, "args": { "External id": 22432,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830480.386, "dur": 4.691, "args": { "External id": 22433,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651830486.837, "dur": 48.316, "args": { "External id": 22434,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5025 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.3", "pid": 1336757, "tid": 1381170, "ts": 1295651830668.378, "dur": 522.849, "args": { "External id": 22435,"Record function id": 0, "Ev Idx": 5026 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 1336757, "tid": 1381170, "ts": 1295651830682.542, "dur": 496.545, "args": { "External id": 22436,"Record function id": 0, "Ev Idx": 5027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651830737.003, "dur": 4.418, "args": { "External id": 22437,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651830756.434, "dur": 21.859, "args": { "External id": 22438,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830760.991, "dur": 1.424, "args": { "External id": 22439,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830764.377, "dur": 0.331, "args": { "External id": 22440,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830765.729, "dur": 0.424, "args": { "External id": 22441,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830767.716, "dur": 0.650, "args": { "External id": 22442,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830769.799, "dur": 0.249, "args": { "External id": 22443,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830770.795, "dur": 0.166, "args": { "External id": 22444,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830771.753, "dur": 0.889, "args": { "External id": 22445,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830773.588, "dur": 0.586, "args": { "External id": 22446,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830775.101, "dur": 0.236, "args": { "External id": 22447,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651830787.913, "dur": 26.932, "args": { "External id": 22448,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5039 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651830842.198, "dur": 83.028, "args": { "External id": 22449,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651830851.123, "dur": 2.629, "args": { "External id": 22450,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651830858.430, "dur": 10.099, "args": { "External id": 22451,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651830862.495, "dur": 5.622, "args": { "External id": 22452,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830865.791, "dur": 0.772, "args": { "External id": 22453,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651830874.941, "dur": 19.372, "args": { "External id": 22454,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830876.888, "dur": 0.354, "args": { "External id": 22455,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830878.664, "dur": 0.330, "args": { "External id": 22456,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830880.510, "dur": 0.664, "args": { "External id": 22457,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830882.377, "dur": 0.383, "args": { "External id": 22458,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830883.502, "dur": 0.586, "args": { "External id": 22459,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830884.711, "dur": 0.754, "args": { "External id": 22460,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830886.927, "dur": 0.631, "args": { "External id": 22461,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830888.417, "dur": 0.281, "args": { "External id": 22462,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651830889.660, "dur": 0.535, "args": { "External id": 22463,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651830901.956, "dur": 16.250, "args": { "External id": 22464,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5055 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651830965.416, "dur": 145.669, "args": { "External id": 22465,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5056 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651831026.341, "dur": 81.115, "args": { "External id": 22466,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5057, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651831036.594, "dur": 66.967, "args": { "External id": 22467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5058 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651831127.166, "dur": 1.884, "args": { "External id": 22468,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5059, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651831204.439, "dur": 1517.806, "args": { "External id": 22469,"Sequence number": 246550, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5060 } }, { "ph": "f", "id": 218, "pid": 1336757, "tid": 1381170, "ts": 1295651831204.439, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651831326.014, "dur": 102.599, "args": { "External id": 22470,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5061 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651831464.842, "dur": 40.032, "args": { "External id": 22471,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651831519.800, "dur": 48.180, "args": { "External id": 22472,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651831577.637, "dur": 34.196, "args": { "External id": 22473,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651831617.720, "dur": 44.394, "args": { "External id": 22474,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651831667.945, "dur": 28.340, "args": { "External id": 22475,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651831702.095, "dur": 42.061, "args": { "External id": 22476,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5067 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651831765.385, "dur": 24.237, "args": { "External id": 22477,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5068 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651831805.760, "dur": 24.375, "args": { "External id": 22478,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5069 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651831850.773, "dur": 19.390, "args": { "External id": 22479,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5070 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651831881.711, "dur": 14.224, "args": { "External id": 22480,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651831903.344, "dur": 28.893, "args": { "External id": 22481,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651831934.989, "dur": 31.745, "args": { "External id": 22482,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5073 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651832029.272, "dur": 168.122, "args": { "External id": 22483,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651832105.213, "dur": 7.112, "args": { "External id": 22484,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651832114.463, "dur": 2.109, "args": { "External id": 22485,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5076 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651832243.490, "dur": 26.972, "args": { "External id": 22486,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5077 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651832284.561, "dur": 15.211, "args": { "External id": 22487,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651832309.092, "dur": 41.291, "args": { "External id": 22488,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651832356.289, "dur": 34.312, "args": { "External id": 22489,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651832397.471, "dur": 22.119, "args": { "External id": 22490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651832423.875, "dur": 29.102, "args": { "External id": 22491,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651832458.266, "dur": 20.519, "args": { "External id": 22492,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651832484.625, "dur": 28.955, "args": { "External id": 22493,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5084 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651832530.889, "dur": 22.432, "args": { "External id": 22494,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5085 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651832569.480, "dur": 22.605, "args": { "External id": 22495,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5086 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651832609.090, "dur": 18.186, "args": { "External id": 22496,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5087 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651832641.126, "dur": 15.153, "args": { "External id": 22497,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5088 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651832668.047, "dur": 15.828, "args": { "External id": 22498,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5089 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832766.893, "dur": 14.811, "args": { "External id": 22499,"Record function id": 0, "Ev Idx": 5090 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832770.473, "dur": 10.388, "args": { "External id": 22500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832774.542, "dur": 5.546, "args": { "External id": 22501,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5092 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832776.012, "dur": 3.995, "args": { "External id": 22502,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5093 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832785.363, "dur": 4.919, "args": { "External id": 22503,"Record function id": 0, "Ev Idx": 5094 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832786.733, "dur": 3.116, "args": { "External id": 22504,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832787.700, "dur": 1.720, "args": { "External id": 22505,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5096 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832788.374, "dur": 0.971, "args": { "External id": 22506,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5097 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832793.438, "dur": 5.137, "args": { "External id": 22507,"Record function id": 0, "Ev Idx": 5098 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832794.733, "dur": 3.388, "args": { "External id": 22508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832795.497, "dur": 2.247, "args": { "External id": 22509,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5100 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832796.380, "dur": 1.258, "args": { "External id": 22510,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832801.713, "dur": 3.476, "args": { "External id": 22511,"Record function id": 0, "Ev Idx": 5102 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832802.743, "dur": 2.034, "args": { "External id": 22512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832803.291, "dur": 1.056, "args": { "External id": 22513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5104 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832803.675, "dur": 0.573, "args": { "External id": 22514,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5105 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832808.204, "dur": 3.808, "args": { "External id": 22515,"Record function id": 0, "Ev Idx": 5106 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832809.238, "dur": 2.357, "args": { "External id": 22516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832810.131, "dur": 1.060, "args": { "External id": 22517,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5108 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832810.500, "dur": 0.626, "args": { "External id": 22518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5109 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832814.951, "dur": 6.654, "args": { "External id": 22519,"Record function id": 0, "Ev Idx": 5110 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832815.806, "dur": 2.225, "args": { "External id": 22520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832816.466, "dur": 1.153, "args": { "External id": 22521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5112 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832816.952, "dur": 0.603, "args": { "External id": 22522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5113 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832824.810, "dur": 3.902, "args": { "External id": 22523,"Record function id": 0, "Ev Idx": 5114 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832826.112, "dur": 2.212, "args": { "External id": 22524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832826.836, "dur": 1.057, "args": { "External id": 22525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5116 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832827.104, "dur": 0.724, "args": { "External id": 22526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5117 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832831.644, "dur": 23.963, "args": { "External id": 22527,"Record function id": 0, "Ev Idx": 5118 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832832.697, "dur": 22.449, "args": { "External id": 22528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832853.447, "dur": 1.243, "args": { "External id": 22529,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5120 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832853.953, "dur": 0.664, "args": { "External id": 22530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832858.695, "dur": 4.418, "args": { "External id": 22531,"Record function id": 0, "Ev Idx": 5122 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651832859.799, "dur": 2.885, "args": { "External id": 22532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832860.278, "dur": 2.007, "args": { "External id": 22533,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5124 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651832861.618, "dur": 0.594, "args": { "External id": 22534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5125 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651832866.624, "dur": 36296.267, "args": { "External id": 22535,"Record function id": 0, "Sequence number": 246549, "Fwd thread id": 1, "Ev Idx": 5126 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651832867.954, "dur": 36286.992, "args": { "External id": 22536,"Sequence number": 246549, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5127 } }, { "ph": "f", "id": 219, "pid": 1336757, "tid": 1381170, "ts": 1295651832867.954, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.4)", "pid": 1336757, "tid": 1381170, "ts": 1295651832900.187, "dur": 38.383, "args": { "External id": 22537,"Record function id": 0, "Ev Idx": 5128 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.4)", "pid": 1336757, "tid": 1381170, "ts": 1295651832946.381, "dur": 105.059, "args": { "External id": 22538,"Record function id": 0, "Ev Idx": 5129 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.4)", "pid": 1336757, "tid": 1381170, "ts": 1295651833059.296, "dur": 36088.243, "args": { "External id": 22539,"Record function id": 0, "Ev Idx": 5130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651833149.505, "dur": 7.296, "args": { "External id": 22540,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651833166.544, "dur": 5.569, "args": { "External id": 22541,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5132 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651833185.955, "dur": 35184.808, "args": { "External id": 22542,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651833200.557, "dur": 35161.459, "args": { "External id": 22543,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651833264.830, "dur": 18.636, "args": { "External id": 22544,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651833289.586, "dur": 35035.184, "args": { "External id": 22545,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651833292.113, "dur": 35032.073, "args": { "External id": 22546,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651833295.567, "dur": 6.784, "args": { "External id": 22547,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651833303.934, "dur": 35017.021, "args": { "External id": 22548,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651868456.367, "dur": 9.197, "args": { "External id": 22549,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651868459.126, "dur": 6.066, "args": { "External id": 22550,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5141 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651868492.289, "dur": 346.143, "args": { "External id": 22551,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5142 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651868518.376, "dur": 316.075, "args": { "External id": 22552,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5143, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651868529.233, "dur": 300.250, "args": { "External id": 22553,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5144 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651868855.169, "dur": 2.393, "args": { "External id": 22554,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5145, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651868910.251, "dur": 6.167, "args": { "External id": 22555,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651868958.209, "dur": 1.161, "args": { "External id": 22556,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651868975.028, "dur": 1.261, "args": { "External id": 22557,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869026.033, "dur": 1.713, "args": { "External id": 22558,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869039.835, "dur": 0.952, "args": { "External id": 22559,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869050.237, "dur": 0.674, "args": { "External id": 22560,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869060.672, "dur": 1.183, "args": { "External id": 22561,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869072.797, "dur": 1.424, "args": { "External id": 22562,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869086.070, "dur": 1.312, "args": { "External id": 22563,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5154 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651869177.860, "dur": 2538.603, "args": { "External id": 22564,"Record function id": 0, "Ev Idx": 5155 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.3)", "pid": 1336757, "tid": 1381170, "ts": 1295651869196.601, "dur": 946.875, "args": { "External id": 22565,"Record function id": 0, "Ev Idx": 5156 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 1336757, "tid": 1381170, "ts": 1295651869209.535, "dur": 314.136, "args": { "External id": 22566,"Record function id": 0, "Ev Idx": 5157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869302.527, "dur": 4.699, "args": { "External id": 22567,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869311.016, "dur": 1.587, "args": { "External id": 22568,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869314.508, "dur": 1.025, "args": { "External id": 22569,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869317.329, "dur": 1.287, "args": { "External id": 22570,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869320.082, "dur": 1.021, "args": { "External id": 22571,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869323.817, "dur": 1.019, "args": { "External id": 22572,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869326.309, "dur": 0.930, "args": { "External id": 22573,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869328.626, "dur": 1.233, "args": { "External id": 22574,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869331.511, "dur": 1.142, "args": { "External id": 22575,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651869335.625, "dur": 0.796, "args": { "External id": 22576,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5167 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651869354.152, "dur": 140.448, "args": { "External id": 22577,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651869369.744, "dur": 120.581, "args": { "External id": 22578,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651869384.835, "dur": 11.531, "args": { "External id": 22579,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651869399.141, "dur": 62.515, "args": { "External id": 22580,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651869401.523, "dur": 59.785, "args": { "External id": 22581,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869404.905, "dur": 4.732, "args": { "External id": 22582,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651869411.305, "dur": 49.451, "args": { "External id": 22583,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5174 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.2", "pid": 1336757, "tid": 1381170, "ts": 1295651869604.626, "dur": 531.638, "args": { "External id": 22584,"Record function id": 0, "Ev Idx": 5175 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 1336757, "tid": 1381170, "ts": 1295651869619.250, "dur": 504.510, "args": { "External id": 22585,"Record function id": 0, "Ev Idx": 5176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651869674.726, "dur": 4.602, "args": { "External id": 22586,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651869694.336, "dur": 20.544, "args": { "External id": 22587,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869698.663, "dur": 1.811, "args": { "External id": 22588,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869702.302, "dur": 0.752, "args": { "External id": 22589,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869704.341, "dur": 0.282, "args": { "External id": 22590,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869705.261, "dur": 0.200, "args": { "External id": 22591,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869706.150, "dur": 0.597, "args": { "External id": 22592,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869707.802, "dur": 0.292, "args": { "External id": 22593,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869708.986, "dur": 0.239, "args": { "External id": 22594,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869710.008, "dur": 0.279, "args": { "External id": 22595,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869711.594, "dur": 0.696, "args": { "External id": 22596,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651869723.523, "dur": 27.029, "args": { "External id": 22597,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5188 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651869778.548, "dur": 85.495, "args": { "External id": 22598,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651869788.009, "dur": 2.925, "args": { "External id": 22599,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651869795.785, "dur": 9.476, "args": { "External id": 22600,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651869799.851, "dur": 5.020, "args": { "External id": 22601,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869802.933, "dur": 0.471, "args": { "External id": 22602,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651869810.875, "dur": 19.289, "args": { "External id": 22603,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869812.314, "dur": 0.937, "args": { "External id": 22604,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869814.928, "dur": 0.657, "args": { "External id": 22605,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869816.650, "dur": 0.490, "args": { "External id": 22606,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869818.035, "dur": 0.679, "args": { "External id": 22607,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869819.935, "dur": 0.607, "args": { "External id": 22608,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869821.610, "dur": 0.172, "args": { "External id": 22609,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869822.850, "dur": 0.339, "args": { "External id": 22610,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869824.045, "dur": 0.622, "args": { "External id": 22611,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651869825.434, "dur": 0.193, "args": { "External id": 22612,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651869838.705, "dur": 18.107, "args": { "External id": 22613,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5204 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651869905.369, "dur": 145.399, "args": { "External id": 22614,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5205 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651869929.515, "dur": 117.669, "args": { "External id": 22615,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5206, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651869938.289, "dur": 104.363, "args": { "External id": 22616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5207 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651870070.197, "dur": 1.939, "args": { "External id": 22617,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5208, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651870150.288, "dur": 1546.867, "args": { "External id": 22618,"Sequence number": 246548, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5209 } }, { "ph": "f", "id": 220, "pid": 1336757, "tid": 1381170, "ts": 1295651870150.288, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651870274.148, "dur": 103.870, "args": { "External id": 22619,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5210 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651870413.654, "dur": 38.752, "args": { "External id": 22620,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651870467.529, "dur": 46.300, "args": { "External id": 22621,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651870522.986, "dur": 31.475, "args": { "External id": 22622,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651870561.114, "dur": 44.497, "args": { "External id": 22623,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651870612.159, "dur": 28.768, "args": { "External id": 22624,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651870646.809, "dur": 42.720, "args": { "External id": 22625,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5216 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651870712.004, "dur": 21.976, "args": { "External id": 22626,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5217 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651870751.987, "dur": 28.066, "args": { "External id": 22627,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5218 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651870799.984, "dur": 19.838, "args": { "External id": 22628,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5219 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651870831.670, "dur": 15.447, "args": { "External id": 22629,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651870854.866, "dur": 29.308, "args": { "External id": 22630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651870887.127, "dur": 31.570, "args": { "External id": 22631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5222 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651870944.351, "dur": 204.120, "args": { "External id": 22632,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651871056.271, "dur": 7.236, "args": { "External id": 22633,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651871065.671, "dur": 1.966, "args": { "External id": 22634,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5225 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651871180.845, "dur": 25.208, "args": { "External id": 22635,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5226 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651871217.798, "dur": 31.159, "args": { "External id": 22636,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651871259.952, "dur": 45.208, "args": { "External id": 22637,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651871311.432, "dur": 35.910, "args": { "External id": 22638,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651871353.835, "dur": 21.157, "args": { "External id": 22639,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651871378.932, "dur": 29.253, "args": { "External id": 22640,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651871413.787, "dur": 23.743, "args": { "External id": 22641,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651871444.436, "dur": 28.593, "args": { "External id": 22642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5233 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651871494.599, "dur": 23.324, "args": { "External id": 22643,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5234 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651871534.467, "dur": 23.089, "args": { "External id": 22644,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5235 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651871572.336, "dur": 17.316, "args": { "External id": 22645,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5236 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651871603.528, "dur": 15.058, "args": { "External id": 22646,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5237 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651871647.555, "dur": 21.304, "args": { "External id": 22647,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5238 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871737.899, "dur": 18.031, "args": { "External id": 22648,"Record function id": 0, "Ev Idx": 5239 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871741.073, "dur": 10.774, "args": { "External id": 22649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871745.189, "dur": 5.826, "args": { "External id": 22650,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5241 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871746.635, "dur": 4.295, "args": { "External id": 22651,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5242 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871759.733, "dur": 4.388, "args": { "External id": 22652,"Record function id": 0, "Ev Idx": 5243 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871761.181, "dur": 2.469, "args": { "External id": 22653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871761.965, "dur": 1.234, "args": { "External id": 22654,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5245 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871762.314, "dur": 0.784, "args": { "External id": 22655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5246 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871767.313, "dur": 3.939, "args": { "External id": 22656,"Record function id": 0, "Ev Idx": 5247 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871768.412, "dur": 2.371, "args": { "External id": 22657,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871768.951, "dur": 1.420, "args": { "External id": 22658,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5249 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871769.567, "dur": 0.697, "args": { "External id": 22659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5250 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871774.366, "dur": 3.942, "args": { "External id": 22660,"Record function id": 0, "Ev Idx": 5251 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871775.537, "dur": 2.346, "args": { "External id": 22661,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871776.217, "dur": 1.247, "args": { "External id": 22662,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5253 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871776.667, "dur": 0.688, "args": { "External id": 22663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5254 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871781.457, "dur": 3.486, "args": { "External id": 22664,"Record function id": 0, "Ev Idx": 5255 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871782.370, "dur": 2.094, "args": { "External id": 22665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871783.002, "dur": 1.071, "args": { "External id": 22666,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5257 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871783.256, "dur": 0.755, "args": { "External id": 22667,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5258 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871788.071, "dur": 4.440, "args": { "External id": 22668,"Record function id": 0, "Ev Idx": 5259 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871789.390, "dur": 2.698, "args": { "External id": 22669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871789.876, "dur": 1.820, "args": { "External id": 22670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5261 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871790.388, "dur": 1.232, "args": { "External id": 22671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5262 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871795.639, "dur": 3.395, "args": { "External id": 22672,"Record function id": 0, "Ev Idx": 5263 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871796.616, "dur": 1.978, "args": { "External id": 22673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871797.121, "dur": 1.039, "args": { "External id": 22674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5265 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871797.411, "dur": 0.675, "args": { "External id": 22675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871802.076, "dur": 5.939, "args": { "External id": 22676,"Record function id": 0, "Ev Idx": 5267 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871803.059, "dur": 4.511, "args": { "External id": 22677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871806.079, "dur": 1.070, "args": { "External id": 22678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5269 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871806.363, "dur": 0.711, "args": { "External id": 22679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5270 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871814.288, "dur": 4.638, "args": { "External id": 22680,"Record function id": 0, "Ev Idx": 5271 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651871815.280, "dur": 3.194, "args": { "External id": 22681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871815.905, "dur": 2.104, "args": { "External id": 22682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5273 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651871817.404, "dur": 0.504, "args": { "External id": 22683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5274 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651871822.468, "dur": 36542.344, "args": { "External id": 22684,"Record function id": 0, "Sequence number": 246547, "Fwd thread id": 1, "Ev Idx": 5275 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651871823.598, "dur": 36532.134, "args": { "External id": 22685,"Sequence number": 246547, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5276 } }, { "ph": "f", "id": 221, "pid": 1336757, "tid": 1381170, "ts": 1295651871823.598, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.3)", "pid": 1336757, "tid": 1381170, "ts": 1295651871850.653, "dur": 37.404, "args": { "External id": 22686,"Record function id": 0, "Ev Idx": 5277 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.3)", "pid": 1336757, "tid": 1381170, "ts": 1295651871898.494, "dur": 62.448, "args": { "External id": 22687,"Record function id": 0, "Ev Idx": 5278 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.3)", "pid": 1336757, "tid": 1381170, "ts": 1295651871966.333, "dur": 36382.167, "args": { "External id": 22688,"Record function id": 0, "Ev Idx": 5279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651872098.375, "dur": 7.191, "args": { "External id": 22689,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651872116.621, "dur": 5.294, "args": { "External id": 22690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5281 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651872140.421, "dur": 35378.106, "args": { "External id": 22691,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651872153.502, "dur": 35357.514, "args": { "External id": 22692,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651872198.627, "dur": 13.893, "args": { "External id": 22693,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651872218.490, "dur": 35253.548, "args": { "External id": 22694,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651872221.178, "dur": 35250.301, "args": { "External id": 22695,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651872224.715, "dur": 22.009, "args": { "External id": 22696,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651872249.157, "dur": 35219.013, "args": { "External id": 22697,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651907602.420, "dur": 8.284, "args": { "External id": 22698,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651907605.165, "dur": 5.267, "args": { "External id": 22699,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5290 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651907635.404, "dur": 414.935, "args": { "External id": 22700,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5291 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651907662.635, "dur": 382.554, "args": { "External id": 22701,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5292, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651907673.015, "dur": 365.874, "args": { "External id": 22702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5293 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651908069.741, "dur": 2.144, "args": { "External id": 22703,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5294, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908130.302, "dur": 6.512, "args": { "External id": 22704,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908179.976, "dur": 1.451, "args": { "External id": 22705,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908196.507, "dur": 1.190, "args": { "External id": 22706,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908208.706, "dur": 0.999, "args": { "External id": 22707,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908220.111, "dur": 0.980, "args": { "External id": 22708,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908246.496, "dur": 1.640, "args": { "External id": 22709,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908261.861, "dur": 0.951, "args": { "External id": 22710,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908277.536, "dur": 0.985, "args": { "External id": 22711,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908288.205, "dur": 1.387, "args": { "External id": 22712,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5303 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651908379.605, "dur": 2568.617, "args": { "External id": 22713,"Record function id": 0, "Ev Idx": 5304 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.2)", "pid": 1336757, "tid": 1381170, "ts": 1295651908397.827, "dur": 974.291, "args": { "External id": 22714,"Record function id": 0, "Ev Idx": 5305 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 1336757, "tid": 1381170, "ts": 1295651908411.475, "dur": 293.093, "args": { "External id": 22715,"Record function id": 0, "Ev Idx": 5306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908488.396, "dur": 4.514, "args": { "External id": 22716,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908496.017, "dur": 1.353, "args": { "External id": 22717,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908499.062, "dur": 1.179, "args": { "External id": 22718,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908501.716, "dur": 1.148, "args": { "External id": 22719,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908505.681, "dur": 1.226, "args": { "External id": 22720,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908508.221, "dur": 0.725, "args": { "External id": 22721,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908510.346, "dur": 0.646, "args": { "External id": 22722,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908512.237, "dur": 1.293, "args": { "External id": 22723,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908516.057, "dur": 1.107, "args": { "External id": 22724,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651908518.460, "dur": 1.040, "args": { "External id": 22725,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5316 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651908536.768, "dur": 141.250, "args": { "External id": 22726,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651908551.574, "dur": 122.113, "args": { "External id": 22727,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651908566.203, "dur": 13.190, "args": { "External id": 22728,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651908582.151, "dur": 62.947, "args": { "External id": 22729,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651908584.670, "dur": 60.041, "args": { "External id": 22730,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908588.076, "dur": 4.934, "args": { "External id": 22731,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651908594.581, "dur": 49.675, "args": { "External id": 22732,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5323 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.1", "pid": 1336757, "tid": 1381170, "ts": 1295651908788.148, "dur": 576.590, "args": { "External id": 22733,"Record function id": 0, "Ev Idx": 5324 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 1336757, "tid": 1381170, "ts": 1295651908802.715, "dur": 549.811, "args": { "External id": 22734,"Record function id": 0, "Ev Idx": 5325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651908857.459, "dur": 4.352, "args": { "External id": 22735,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651908883.287, "dur": 23.845, "args": { "External id": 22736,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908889.808, "dur": 1.225, "args": { "External id": 22737,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908892.743, "dur": 0.269, "args": { "External id": 22738,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908894.275, "dur": 0.730, "args": { "External id": 22739,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908896.433, "dur": 0.382, "args": { "External id": 22740,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908897.717, "dur": 0.545, "args": { "External id": 22741,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908899.199, "dur": 0.495, "args": { "External id": 22742,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908901.258, "dur": 0.436, "args": { "External id": 22743,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908902.489, "dur": 0.445, "args": { "External id": 22744,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651908903.736, "dur": 0.282, "args": { "External id": 22745,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651908916.356, "dur": 27.986, "args": { "External id": 22746,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5337 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651908972.246, "dur": 139.653, "args": { "External id": 22747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651909020.859, "dur": 4.526, "args": { "External id": 22748,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651909031.482, "dur": 10.644, "args": { "External id": 22749,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651909035.736, "dur": 6.004, "args": { "External id": 22750,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909039.422, "dur": 0.703, "args": { "External id": 22751,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651909049.519, "dur": 22.986, "args": { "External id": 22752,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909051.350, "dur": 0.634, "args": { "External id": 22753,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909053.199, "dur": 0.528, "args": { "External id": 22754,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909054.981, "dur": 0.699, "args": { "External id": 22755,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909056.788, "dur": 0.715, "args": { "External id": 22756,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909058.377, "dur": 0.584, "args": { "External id": 22757,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909060.358, "dur": 0.446, "args": { "External id": 22758,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909063.796, "dur": 0.260, "args": { "External id": 22759,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909064.736, "dur": 0.264, "args": { "External id": 22760,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651909066.562, "dur": 0.948, "args": { "External id": 22761,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651909083.510, "dur": 20.575, "args": { "External id": 22762,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5353 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651909157.367, "dur": 126.290, "args": { "External id": 22763,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5354 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651909181.166, "dur": 98.698, "args": { "External id": 22764,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5355, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651909190.268, "dur": 85.403, "args": { "External id": 22765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5356 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651909299.200, "dur": 1.791, "args": { "External id": 22766,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5357, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651909379.034, "dur": 1549.235, "args": { "External id": 22767,"Sequence number": 246546, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5358 } }, { "ph": "f", "id": 222, "pid": 1336757, "tid": 1381170, "ts": 1295651909379.034, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651909485.494, "dur": 99.814, "args": { "External id": 22768,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5359 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651909621.112, "dur": 41.012, "args": { "External id": 22769,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651909677.199, "dur": 47.156, "args": { "External id": 22770,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651909732.421, "dur": 33.064, "args": { "External id": 22771,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651909771.582, "dur": 43.966, "args": { "External id": 22772,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651909822.659, "dur": 27.731, "args": { "External id": 22773,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651909856.923, "dur": 41.713, "args": { "External id": 22774,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5365 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651909920.820, "dur": 22.673, "args": { "External id": 22775,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5366 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651909959.603, "dur": 70.848, "args": { "External id": 22776,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5367 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651910055.454, "dur": 24.249, "args": { "External id": 22777,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5368 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651910092.640, "dur": 15.701, "args": { "External id": 22778,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910116.205, "dur": 38.036, "args": { "External id": 22779,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910157.398, "dur": 33.615, "args": { "External id": 22780,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5371 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651910215.185, "dur": 192.235, "args": { "External id": 22781,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651910310.680, "dur": 6.646, "args": { "External id": 22782,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651910322.564, "dur": 2.403, "args": { "External id": 22783,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5374 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651910438.234, "dur": 26.094, "args": { "External id": 22784,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5375 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651910476.055, "dur": 14.520, "args": { "External id": 22785,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910498.467, "dur": 38.956, "args": { "External id": 22786,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910543.173, "dur": 34.393, "args": { "External id": 22787,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910584.024, "dur": 22.453, "args": { "External id": 22788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910610.576, "dur": 29.667, "args": { "External id": 22789,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910645.639, "dur": 21.027, "args": { "External id": 22790,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651910672.035, "dur": 29.357, "args": { "External id": 22791,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5382 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651910718.297, "dur": 22.256, "args": { "External id": 22792,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5383 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651910757.794, "dur": 23.945, "args": { "External id": 22793,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5384 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651910795.907, "dur": 16.711, "args": { "External id": 22794,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5385 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651910827.839, "dur": 28.551, "args": { "External id": 22795,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5386 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651910879.131, "dur": 18.394, "args": { "External id": 22796,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5387 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651910973.212, "dur": 54.172, "args": { "External id": 22797,"Record function id": 0, "Ev Idx": 5388 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651910976.273, "dur": 49.481, "args": { "External id": 22798,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651910980.491, "dur": 43.783, "args": { "External id": 22799,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5390 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651910981.756, "dur": 41.985, "args": { "External id": 22800,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5391 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911034.121, "dur": 6.400, "args": { "External id": 22801,"Record function id": 0, "Ev Idx": 5392 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911035.878, "dur": 4.193, "args": { "External id": 22802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911037.563, "dur": 1.957, "args": { "External id": 22803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5394 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911038.561, "dur": 0.884, "args": { "External id": 22804,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5395 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911043.978, "dur": 4.176, "args": { "External id": 22805,"Record function id": 0, "Ev Idx": 5396 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911045.165, "dur": 2.565, "args": { "External id": 22806,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911045.886, "dur": 1.399, "args": { "External id": 22807,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5398 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911046.424, "dur": 0.746, "args": { "External id": 22808,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5399 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911051.437, "dur": 4.078, "args": { "External id": 22809,"Record function id": 0, "Ev Idx": 5400 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911052.514, "dur": 2.555, "args": { "External id": 22810,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911053.296, "dur": 1.353, "args": { "External id": 22811,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5402 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911053.970, "dur": 0.581, "args": { "External id": 22812,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5403 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911058.738, "dur": 3.921, "args": { "External id": 22813,"Record function id": 0, "Ev Idx": 5404 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911059.874, "dur": 2.362, "args": { "External id": 22814,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911060.524, "dur": 1.267, "args": { "External id": 22815,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5406 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911061.010, "dur": 0.673, "args": { "External id": 22816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5407 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911065.743, "dur": 4.018, "args": { "External id": 22817,"Record function id": 0, "Ev Idx": 5408 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911066.952, "dur": 2.344, "args": { "External id": 22818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911067.478, "dur": 1.396, "args": { "External id": 22819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5410 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911067.981, "dur": 0.829, "args": { "External id": 22820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5411 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911072.992, "dur": 3.331, "args": { "External id": 22821,"Record function id": 0, "Ev Idx": 5412 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911073.991, "dur": 1.920, "args": { "External id": 22822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911074.476, "dur": 0.988, "args": { "External id": 22823,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5414 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911074.770, "dur": 0.619, "args": { "External id": 22824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5415 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911083.171, "dur": 3.150, "args": { "External id": 22825,"Record function id": 0, "Ev Idx": 5416 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911084.176, "dur": 1.735, "args": { "External id": 22826,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911084.625, "dur": 0.869, "args": { "External id": 22827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5418 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911084.898, "dur": 0.524, "args": { "External id": 22828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5419 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911089.395, "dur": 5.166, "args": { "External id": 22829,"Record function id": 0, "Ev Idx": 5420 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651911090.335, "dur": 3.807, "args": { "External id": 22830,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911090.786, "dur": 2.956, "args": { "External id": 22831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5422 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651911093.235, "dur": 0.440, "args": { "External id": 22832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5423 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651911098.729, "dur": 37258.395, "args": { "External id": 22833,"Record function id": 0, "Sequence number": 246545, "Fwd thread id": 1, "Ev Idx": 5424 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651911099.839, "dur": 37248.990, "args": { "External id": 22834,"Sequence number": 246545, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5425 } }, { "ph": "f", "id": 223, "pid": 1336757, "tid": 1381170, "ts": 1295651911099.839, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.2)", "pid": 1336757, "tid": 1381170, "ts": 1295651911128.473, "dur": 40.171, "args": { "External id": 22835,"Record function id": 0, "Ev Idx": 5426 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.2)", "pid": 1336757, "tid": 1381170, "ts": 1295651911176.442, "dur": 86.256, "args": { "External id": 22836,"Record function id": 0, "Ev Idx": 5427 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.2)", "pid": 1336757, "tid": 1381170, "ts": 1295651911270.224, "dur": 37071.198, "args": { "External id": 22837,"Record function id": 0, "Ev Idx": 5428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651911360.306, "dur": 7.128, "args": { "External id": 22838,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651911379.626, "dur": 4.967, "args": { "External id": 22839,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5430 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651911398.993, "dur": 36035.690, "args": { "External id": 22840,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651911413.345, "dur": 36012.837, "args": { "External id": 22841,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651911457.816, "dur": 14.561, "args": { "External id": 22842,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651911478.201, "dur": 35911.260, "args": { "External id": 22843,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651911480.535, "dur": 35908.262, "args": { "External id": 22844,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651911484.102, "dur": 8.633, "args": { "External id": 22845,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651911494.272, "dur": 35891.112, "args": { "External id": 22846,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651947520.918, "dur": 9.549, "args": { "External id": 22847,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651947523.548, "dur": 6.537, "args": { "External id": 22848,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5439 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651947557.354, "dur": 483.459, "args": { "External id": 22849,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5440 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651947585.513, "dur": 449.940, "args": { "External id": 22850,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5441, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651947596.520, "dur": 432.680, "args": { "External id": 22851,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5442 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651948062.163, "dur": 2.989, "args": { "External id": 22852,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5443, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948126.497, "dur": 6.454, "args": { "External id": 22853,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948177.325, "dur": 1.534, "args": { "External id": 22854,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948195.162, "dur": 1.166, "args": { "External id": 22855,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948207.251, "dur": 0.816, "args": { "External id": 22856,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948218.348, "dur": 0.819, "args": { "External id": 22857,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948243.068, "dur": 1.603, "args": { "External id": 22858,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948258.880, "dur": 1.167, "args": { "External id": 22859,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948270.702, "dur": 2.129, "args": { "External id": 22860,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948281.527, "dur": 1.074, "args": { "External id": 22861,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5452 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651948371.715, "dur": 2566.552, "args": { "External id": 22862,"Record function id": 0, "Ev Idx": 5453 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.1)", "pid": 1336757, "tid": 1381170, "ts": 1295651948390.194, "dur": 972.548, "args": { "External id": 22863,"Record function id": 0, "Ev Idx": 5454 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 1336757, "tid": 1381170, "ts": 1295651948404.432, "dur": 289.417, "args": { "External id": 22864,"Record function id": 0, "Ev Idx": 5455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948481.803, "dur": 3.991, "args": { "External id": 22865,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948488.908, "dur": 1.367, "args": { "External id": 22866,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948492.088, "dur": 0.736, "args": { "External id": 22867,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948494.433, "dur": 0.721, "args": { "External id": 22868,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948497.837, "dur": 1.465, "args": { "External id": 22869,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948500.409, "dur": 1.083, "args": { "External id": 22870,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948503.226, "dur": 1.289, "args": { "External id": 22871,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948506.098, "dur": 1.467, "args": { "External id": 22872,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948510.247, "dur": 0.557, "args": { "External id": 22873,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651948512.144, "dur": 0.546, "args": { "External id": 22874,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5465 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651948528.686, "dur": 139.244, "args": { "External id": 22875,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651948544.171, "dur": 119.944, "args": { "External id": 22876,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651948559.823, "dur": 11.961, "args": { "External id": 22877,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651948574.690, "dur": 62.615, "args": { "External id": 22878,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651948577.542, "dur": 59.494, "args": { "External id": 22879,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948581.045, "dur": 5.021, "args": { "External id": 22880,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651948587.870, "dur": 48.703, "args": { "External id": 22881,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5472 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.0", "pid": 1336757, "tid": 1381170, "ts": 1295651948778.798, "dur": 576.484, "args": { "External id": 22882,"Record function id": 0, "Ev Idx": 5473 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 1336757, "tid": 1381170, "ts": 1295651948793.987, "dur": 547.826, "args": { "External id": 22883,"Record function id": 0, "Ev Idx": 5474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651948856.354, "dur": 4.845, "args": { "External id": 22884,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651948876.226, "dur": 20.966, "args": { "External id": 22885,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948880.227, "dur": 1.364, "args": { "External id": 22886,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948883.159, "dur": 0.312, "args": { "External id": 22887,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948884.916, "dur": 0.679, "args": { "External id": 22888,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948886.760, "dur": 0.226, "args": { "External id": 22889,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948888.055, "dur": 0.195, "args": { "External id": 22890,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948889.227, "dur": 0.594, "args": { "External id": 22891,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948891.574, "dur": 0.518, "args": { "External id": 22892,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948892.709, "dur": 0.270, "args": { "External id": 22893,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651948893.702, "dur": 0.257, "args": { "External id": 22894,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651948906.884, "dur": 27.346, "args": { "External id": 22895,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5486 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1381170, "ts": 1295651948962.215, "dur": 131.959, "args": { "External id": 22896,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651948971.150, "dur": 3.529, "args": { "External id": 22897,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1381170, "ts": 1295651948979.153, "dur": 50.891, "args": { "External id": 22898,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1381170, "ts": 1295651949022.833, "dur": 6.758, "args": { "External id": 22899,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949026.890, "dur": 0.768, "args": { "External id": 22900,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1381170, "ts": 1295651949038.145, "dur": 17.731, "args": { "External id": 22901,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949039.913, "dur": 0.421, "args": { "External id": 22902,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949041.541, "dur": 0.608, "args": { "External id": 22903,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949043.440, "dur": 0.461, "args": { "External id": 22904,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949044.742, "dur": 0.304, "args": { "External id": 22905,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949046.086, "dur": 0.498, "args": { "External id": 22906,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949047.570, "dur": 0.531, "args": { "External id": 22907,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949049.082, "dur": 0.356, "args": { "External id": 22908,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949050.004, "dur": 0.281, "args": { "External id": 22909,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651949050.834, "dur": 0.345, "args": { "External id": 22910,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651949065.392, "dur": 21.065, "args": { "External id": 22911,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5502 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651949138.711, "dur": 129.831, "args": { "External id": 22912,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5503 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651949164.881, "dur": 99.871, "args": { "External id": 22913,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5504, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1381170, "ts": 1295651949173.985, "dur": 86.471, "args": { "External id": 22914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5505 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651949284.804, "dur": 2.141, "args": { "External id": 22915,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5506, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651949369.617, "dur": 1547.313, "args": { "External id": 22916,"Sequence number": 246544, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5507 } }, { "ph": "f", "id": 224, "pid": 1336757, "tid": 1381170, "ts": 1295651949369.617, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651949481.712, "dur": 101.285, "args": { "External id": 22917,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5508 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651949622.357, "dur": 39.510, "args": { "External id": 22918,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651949676.661, "dur": 50.468, "args": { "External id": 22919,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651949736.878, "dur": 31.890, "args": { "External id": 22920,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651949775.365, "dur": 45.029, "args": { "External id": 22921,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651949827.404, "dur": 27.895, "args": { "External id": 22922,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651949861.891, "dur": 41.111, "args": { "External id": 22923,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5514 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651949924.110, "dur": 22.014, "args": { "External id": 22924,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5515 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651949963.260, "dur": 69.104, "args": { "External id": 22925,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5516 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651950056.702, "dur": 21.157, "args": { "External id": 22926,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5517 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651950090.597, "dur": 15.166, "args": { "External id": 22927,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950114.310, "dur": 33.287, "args": { "External id": 22928,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950150.871, "dur": 32.538, "args": { "External id": 22929,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5520 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651950209.307, "dur": 177.780, "args": { "External id": 22930,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651950296.381, "dur": 6.685, "args": { "External id": 22931,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651950305.155, "dur": 1.887, "args": { "External id": 22932,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5523 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651950419.309, "dur": 25.102, "args": { "External id": 22933,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5524 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651950455.517, "dur": 14.719, "args": { "External id": 22934,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950478.160, "dur": 36.778, "args": { "External id": 22935,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950519.989, "dur": 33.158, "args": { "External id": 22936,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950559.561, "dur": 24.620, "args": { "External id": 22937,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950587.874, "dur": 28.643, "args": { "External id": 22938,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950621.570, "dur": 24.181, "args": { "External id": 22939,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651950652.274, "dur": 28.568, "args": { "External id": 22940,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5531 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651950700.757, "dur": 22.165, "args": { "External id": 22941,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5532 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651950742.587, "dur": 26.933, "args": { "External id": 22942,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5533 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651950783.732, "dur": 26.528, "args": { "External id": 22943,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5534 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651950836.455, "dur": 21.323, "args": { "External id": 22944,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5535 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651950874.044, "dur": 15.816, "args": { "External id": 22945,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5536 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651950959.595, "dur": 15.626, "args": { "External id": 22946,"Record function id": 0, "Ev Idx": 5537 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651950963.307, "dur": 11.037, "args": { "External id": 22947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651950967.321, "dur": 6.066, "args": { "External id": 22948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5539 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651950968.973, "dur": 4.322, "args": { "External id": 22949,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5540 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651950979.008, "dur": 4.703, "args": { "External id": 22950,"Record function id": 0, "Ev Idx": 5541 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651950980.547, "dur": 2.660, "args": { "External id": 22951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651950981.352, "dur": 1.399, "args": { "External id": 22952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5543 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651950981.868, "dur": 0.772, "args": { "External id": 22953,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5544 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951029.764, "dur": 7.080, "args": { "External id": 22954,"Record function id": 0, "Ev Idx": 5545 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951031.800, "dur": 4.341, "args": { "External id": 22955,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951032.955, "dur": 2.319, "args": { "External id": 22956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5547 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951033.912, "dur": 1.160, "args": { "External id": 22957,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5548 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951040.115, "dur": 4.147, "args": { "External id": 22958,"Record function id": 0, "Ev Idx": 5549 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951041.146, "dur": 2.678, "args": { "External id": 22959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951041.997, "dur": 1.353, "args": { "External id": 22960,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5551 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951042.321, "dur": 0.898, "args": { "External id": 22961,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5552 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951050.450, "dur": 4.013, "args": { "External id": 22962,"Record function id": 0, "Ev Idx": 5553 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951051.737, "dur": 2.288, "args": { "External id": 22963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951052.306, "dur": 1.207, "args": { "External id": 22964,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5555 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951052.640, "dur": 0.809, "args": { "External id": 22965,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5556 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951057.576, "dur": 3.941, "args": { "External id": 22966,"Record function id": 0, "Ev Idx": 5557 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951058.522, "dur": 2.544, "args": { "External id": 22967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951059.590, "dur": 1.073, "args": { "External id": 22968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5559 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951060.001, "dur": 0.589, "args": { "External id": 22969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951064.639, "dur": 4.187, "args": { "External id": 22970,"Record function id": 0, "Ev Idx": 5561 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951066.323, "dur": 2.029, "args": { "External id": 22971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951066.839, "dur": 1.090, "args": { "External id": 22972,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5563 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951067.105, "dur": 0.759, "args": { "External id": 22973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5564 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951071.866, "dur": 3.543, "args": { "External id": 22974,"Record function id": 0, "Ev Idx": 5565 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951072.883, "dur": 2.060, "args": { "External id": 22975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951073.375, "dur": 1.182, "args": { "External id": 22976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5567 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951073.642, "dur": 0.850, "args": { "External id": 22977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5568 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951078.408, "dur": 4.384, "args": { "External id": 22978,"Record function id": 0, "Ev Idx": 5569 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651951079.519, "dur": 2.816, "args": { "External id": 22979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951079.975, "dur": 1.968, "args": { "External id": 22980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5571 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651951081.179, "dur": 0.659, "args": { "External id": 22981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5572 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651951086.402, "dur": 36186.441, "args": { "External id": 22982,"Record function id": 0, "Sequence number": 246543, "Fwd thread id": 1, "Ev Idx": 5573 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651951087.720, "dur": 36175.863, "args": { "External id": 22983,"Sequence number": 246543, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5574 } }, { "ph": "f", "id": 225, "pid": 1336757, "tid": 1381170, "ts": 1295651951087.720, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.1)", "pid": 1336757, "tid": 1381170, "ts": 1295651951118.736, "dur": 33.019, "args": { "External id": 22984,"Record function id": 0, "Ev Idx": 5575 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.1)", "pid": 1336757, "tid": 1381170, "ts": 1295651951159.137, "dur": 66.406, "args": { "External id": 22985,"Record function id": 0, "Ev Idx": 5576 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.1)", "pid": 1336757, "tid": 1381170, "ts": 1295651951247.052, "dur": 36008.183, "args": { "External id": 22986,"Record function id": 0, "Ev Idx": 5577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651951336.365, "dur": 10.936, "args": { "External id": 22987,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651951357.584, "dur": 4.999, "args": { "External id": 22988,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5579 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651951376.381, "dur": 35079.829, "args": { "External id": 22989,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651951388.852, "dur": 35059.075, "args": { "External id": 22990,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651951431.608, "dur": 14.994, "args": { "External id": 22991,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651951452.393, "dur": 34954.675, "args": { "External id": 22992,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651951455.886, "dur": 34950.599, "args": { "External id": 22993,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651951458.949, "dur": 5.040, "args": { "External id": 22994,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651951465.566, "dur": 34937.546, "args": { "External id": 22995,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295651986541.903, "dur": 8.956, "args": { "External id": 22996,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651986544.382, "dur": 6.149, "args": { "External id": 22997,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5588 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295651986577.987, "dur": 354.335, "args": { "External id": 22998,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5589 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651986603.990, "dur": 323.387, "args": { "External id": 22999,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5590, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295651986614.428, "dur": 307.149, "args": { "External id": 23000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5591 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295651986950.527, "dur": 2.070, "args": { "External id": 23001,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5592, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987043.088, "dur": 6.694, "args": { "External id": 23002,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987094.800, "dur": 1.259, "args": { "External id": 23003,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987111.606, "dur": 1.059, "args": { "External id": 23004,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987124.514, "dur": 0.797, "args": { "External id": 23005,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987136.530, "dur": 0.946, "args": { "External id": 23006,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987146.290, "dur": 0.692, "args": { "External id": 23007,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987156.855, "dur": 1.101, "args": { "External id": 23008,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987168.018, "dur": 1.140, "args": { "External id": 23009,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987178.966, "dur": 0.735, "args": { "External id": 23010,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5601 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651987288.681, "dur": 2095.820, "args": { "External id": 23011,"Record function id": 0, "Ev Idx": 5602 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.0)", "pid": 1336757, "tid": 1381170, "ts": 1295651987309.576, "dur": 409.446, "args": { "External id": 23012,"Record function id": 0, "Ev Idx": 5603 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 1336757, "tid": 1381170, "ts": 1295651987323.297, "dur": 300.093, "args": { "External id": 23013,"Record function id": 0, "Ev Idx": 5604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987409.339, "dur": 4.659, "args": { "External id": 23014,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987417.146, "dur": 1.072, "args": { "External id": 23015,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987420.798, "dur": 1.049, "args": { "External id": 23016,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987423.623, "dur": 1.128, "args": { "External id": 23017,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987426.482, "dur": 0.920, "args": { "External id": 23018,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987429.194, "dur": 1.392, "args": { "External id": 23019,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987433.300, "dur": 0.474, "args": { "External id": 23020,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987434.920, "dur": 0.911, "args": { "External id": 23021,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987437.404, "dur": 0.928, "args": { "External id": 23022,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651987439.701, "dur": 0.451, "args": { "External id": 23023,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5614 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651987457.146, "dur": 138.054, "args": { "External id": 23024,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651987474.328, "dur": 116.978, "args": { "External id": 23025,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651987488.892, "dur": 11.691, "args": { "External id": 23026,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651987503.519, "dur": 61.596, "args": { "External id": 23027,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651987505.756, "dur": 59.027, "args": { "External id": 23028,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651987509.452, "dur": 4.963, "args": { "External id": 23029,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651987516.115, "dur": 48.192, "args": { "External id": 23030,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5621 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651987725.258, "dur": 1637.946, "args": { "External id": 23031,"Sequence number": 246542, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5622 } }, { "ph": "f", "id": 226, "pid": 1336757, "tid": 1381170, "ts": 1295651987725.258, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651987829.977, "dur": 98.904, "args": { "External id": 23032,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5623 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336757, "tid": 1381170, "ts": 1295651987964.152, "dur": 81.502, "args": { "External id": 23033,"kernel_hash": "cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qt/cqtv52ovuip3ol5r6wg244twcee7ut4ombdtlv3jt7eknkh3yxxu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336757, "tid": 1381170, "ts": 1295651988065.980, "dur": 57.558, "args": { "External id": 23034,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988133.110, "dur": 36.163, "args": { "External id": 23035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988175.733, "dur": 44.823, "args": { "External id": 23036,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988227.936, "dur": 46.511, "args": { "External id": 23037,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988283.935, "dur": 41.742, "args": { "External id": 23038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5629 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336757, "tid": 1381170, "ts": 1295651988351.778, "dur": 23.678, "args": { "External id": 23039,"kernel_hash": "ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/t6/ct6pdrwin6gpbbhb3ubmfazw3qma3gzsewwbv4culi3mwmzponsp.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5630 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336757, "tid": 1381170, "ts": 1295651988392.675, "dur": 29.634, "args": { "External id": 23040,"kernel_hash": "cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/z6/cz6ucetbngq4jgbopxnyfp6gcid5s5ztsv5ncyzjsjt7tfq7ipcf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5631 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651988459.936, "dur": 20.879, "args": { "External id": 23041,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5632 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651988494.086, "dur": 15.894, "args": { "External id": 23042,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988517.020, "dur": 34.318, "args": { "External id": 23043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988554.429, "dur": 36.560, "args": { "External id": 23044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5635 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336757, "tid": 1381170, "ts": 1295651988617.189, "dur": 173.089, "args": { "External id": 23045,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651988700.984, "dur": 6.091, "args": { "External id": 23046,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651988708.782, "dur": 1.634, "args": { "External id": 23047,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5638 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651988819.561, "dur": 25.575, "args": { "External id": 23048,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5639 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1381170, "ts": 1295651988855.650, "dur": 14.282, "args": { "External id": 23049,"kernel_hash": "cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/p6/cp6j6nhpwjd6mqsefl44gnnjkpkrjt2lnxslguyz45haxtbxbto3.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988878.309, "dur": 34.762, "args": { "External id": 23050,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988918.765, "dur": 34.809, "args": { "External id": 23051,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651988959.267, "dur": 61.953, "args": { "External id": 23052,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651989029.570, "dur": 34.805, "args": { "External id": 23053,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651989070.886, "dur": 21.590, "args": { "External id": 23054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1381170, "ts": 1295651989099.900, "dur": 29.290, "args": { "External id": 23055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5646 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336757, "tid": 1381170, "ts": 1295651989146.591, "dur": 24.156, "args": { "External id": 23056,"kernel_hash": "cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qs/cqsmoyietljwwem74pqj7rw77h2baol67y2jdqdgbsq7tblfkrf4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5647 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336757, "tid": 1381170, "ts": 1295651989188.841, "dur": 25.712, "args": { "External id": 23057,"kernel_hash": "clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/lr/clrhf26bqgdimbaet5vq7dtthfchb2oh7voorngyplnz6tf2aame.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5648 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336757, "tid": 1381170, "ts": 1295651989246.497, "dur": 20.585, "args": { "External id": 23058,"kernel_hash": "cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/wg/cwgmcdkxcf3qaknrmuortliovuosbdico7imkwflk5thajnwoiwl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5649 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336757, "tid": 1381170, "ts": 1295651989284.586, "dur": 18.882, "args": { "External id": 23059,"kernel_hash": "crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/rq/crqtfcpyfpzzdibd36dgyl26ixald2ez2onww6lldxkvjtmbpczd.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5650 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336757, "tid": 1381170, "ts": 1295651989318.769, "dur": 16.105, "args": { "External id": 23060,"kernel_hash": "cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/em/cemjdqi5ghk3i77b2rg37v3lyvjbugp7r7bobzjsarysugcnwrjj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5651 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989406.957, "dur": 18.016, "args": { "External id": 23061,"Record function id": 0, "Ev Idx": 5652 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989410.437, "dur": 13.626, "args": { "External id": 23062,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989417.535, "dur": 5.629, "args": { "External id": 23063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5654 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989418.769, "dur": 4.272, "args": { "External id": 23064,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5655 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989428.922, "dur": 4.641, "args": { "External id": 23065,"Record function id": 0, "Ev Idx": 5656 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989430.334, "dur": 2.689, "args": { "External id": 23066,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989430.983, "dur": 1.508, "args": { "External id": 23067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5658 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989431.528, "dur": 0.886, "args": { "External id": 23068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5659 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989436.835, "dur": 3.926, "args": { "External id": 23069,"Record function id": 0, "Ev Idx": 5660 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989438.217, "dur": 2.110, "args": { "External id": 23070,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989438.725, "dur": 1.155, "args": { "External id": 23071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5662 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989439.354, "dur": 0.442, "args": { "External id": 23072,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5663 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989444.046, "dur": 4.730, "args": { "External id": 23073,"Record function id": 0, "Ev Idx": 5664 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989445.600, "dur": 2.741, "args": { "External id": 23074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989446.333, "dur": 1.577, "args": { "External id": 23075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5666 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989446.873, "dur": 0.945, "args": { "External id": 23076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5667 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989451.957, "dur": 4.442, "args": { "External id": 23077,"Record function id": 0, "Ev Idx": 5668 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989453.561, "dur": 2.428, "args": { "External id": 23078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989454.160, "dur": 1.398, "args": { "External id": 23079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5670 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989454.429, "dur": 1.063, "args": { "External id": 23080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5671 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989459.510, "dur": 3.926, "args": { "External id": 23081,"Record function id": 0, "Ev Idx": 5672 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989460.971, "dur": 2.061, "args": { "External id": 23082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989461.456, "dur": 1.150, "args": { "External id": 23083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5674 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989461.955, "dur": 0.556, "args": { "External id": 23084,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5675 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989466.818, "dur": 6.873, "args": { "External id": 23085,"Record function id": 0, "Ev Idx": 5676 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989467.987, "dur": 1.798, "args": { "External id": 23086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989468.589, "dur": 0.787, "args": { "External id": 23087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5678 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989468.852, "dur": 0.458, "args": { "External id": 23088,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5679 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989476.919, "dur": 4.012, "args": { "External id": 23089,"Record function id": 0, "Ev Idx": 5680 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989478.593, "dur": 1.924, "args": { "External id": 23090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989479.093, "dur": 0.997, "args": { "External id": 23091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5682 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989479.369, "dur": 0.654, "args": { "External id": 23092,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5683 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989484.013, "dur": 3.859, "args": { "External id": 23093,"Record function id": 0, "Ev Idx": 5684 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295651989485.472, "dur": 1.988, "args": { "External id": 23094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989485.942, "dur": 1.102, "args": { "External id": 23095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5686 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295651989486.476, "dur": 0.493, "args": { "External id": 23096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5687 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651989491.570, "dur": 36315.828, "args": { "External id": 23097,"Record function id": 0, "Sequence number": 246541, "Fwd thread id": 1, "Ev Idx": 5688 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295651989492.811, "dur": 36306.182, "args": { "External id": 23098,"Sequence number": 246541, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5689 } }, { "ph": "f", "id": 227, "pid": 1336757, "tid": 1381170, "ts": 1295651989492.811, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.0)", "pid": 1336757, "tid": 1381170, "ts": 1295651989520.059, "dur": 37.643, "args": { "External id": 23099,"Record function id": 0, "Ev Idx": 5690 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.0)", "pid": 1336757, "tid": 1381170, "ts": 1295651989564.968, "dur": 71.126, "args": { "External id": 23100,"Record function id": 0, "Ev Idx": 5691 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.0)", "pid": 1336757, "tid": 1381170, "ts": 1295651989642.141, "dur": 36149.520, "args": { "External id": 23101,"Record function id": 0, "Ev Idx": 5692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651989731.994, "dur": 6.189, "args": { "External id": 23102,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295651989750.187, "dur": 4.686, "args": { "External id": 23103,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5694 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651989778.819, "dur": 35265.836, "args": { "External id": 23104,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295651989797.929, "dur": 35238.840, "args": { "External id": 23105,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295651989844.920, "dur": 15.217, "args": { "External id": 23106,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295651989866.223, "dur": 35100.956, "args": { "External id": 23107,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295651989868.635, "dur": 35097.930, "args": { "External id": 23108,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295651989872.384, "dur": 5.516, "args": { "External id": 23109,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295651989879.533, "dur": 35084.380, "args": { "External id": 23110,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295652025129.061, "dur": 8.460, "args": { "External id": 23111,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295652025131.617, "dur": 5.605, "args": { "External id": 23112,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5703 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295652025163.800, "dur": 353.284, "args": { "External id": 23113,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5704 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295652025190.828, "dur": 321.792, "args": { "External id": 23114,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5705, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295652025201.756, "dur": 305.473, "args": { "External id": 23115,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5706 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295652025536.434, "dur": 2.386, "args": { "External id": 23116,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5707, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025595.586, "dur": 6.407, "args": { "External id": 23117,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025643.846, "dur": 1.575, "args": { "External id": 23118,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025662.038, "dur": 1.162, "args": { "External id": 23119,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025675.071, "dur": 0.893, "args": { "External id": 23120,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025687.638, "dur": 1.148, "args": { "External id": 23121,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025699.286, "dur": 1.358, "args": { "External id": 23122,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025711.157, "dur": 0.999, "args": { "External id": 23123,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025722.847, "dur": 1.211, "args": { "External id": 23124,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652025733.724, "dur": 0.793, "args": { "External id": 23125,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5716 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295652025821.452, "dur": 310.343, "args": { "External id": 23126,"Record function id": 0, "Sequence number": 246540, "Fwd thread id": 1, "Ev Idx": 5717 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336757, "tid": 1381170, "ts": 1295652025824.032, "dur": 299.149, "args": { "External id": 23127,"Sequence number": 246540, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5718 } }, { "ph": "f", "id": 228, "pid": 1336757, "tid": 1381170, "ts": 1295652025824.032, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_0", "pid": 1336757, "tid": 1381170, "ts": 1295652025937.614, "dur": 42.746, "args": { "External id": 23128,"kernel_hash": "ciduma7cu5eg2vb7pjzy37skdgvzi7kewhtlfbbosvucja2bojsj", "grid": "grid(65536000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "65536000"], "kernel_file": "/tmp/torchinductor_cvm/id/ciduma7cu5eg2vb7pjzy37skdgvzi7kewhtlfbbosvucja2bojsj.py", "kernel_backend": "triton", "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 5719 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_1", "pid": 1336757, "tid": 1381170, "ts": 1295652026037.911, "dur": 29.440, "args": { "External id": 23129,"kernel_hash": "caujkv5qkif2iwziam2o6fi3v6fyh3htmhp45aeprztex4h267rb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/au/caujkv5qkif2iwziam2o6fi3v6fyh3htmhp45aeprztex4h267rb.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "float", "Scalar"], "Input Strides": [[4096, 1], [8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096], [16, 4096, 2048], [32000, 2048], []], "Ev Idx": 5720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_2", "pid": 1336757, "tid": 1381170, "ts": 1295652026085.411, "dur": 22.036, "args": { "External id": 23130,"kernel_hash": "cfq2gzp6xuirheiddwf3ictuku4xly4uz6pgv7jhaatakl55p4ao", "grid": "grid(65536000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "65536000"], "kernel_file": "/tmp/torchinductor_cvm/fq/cfq2gzp6xuirheiddwf3ictuku4xly4uz6pgv7jhaatakl55p4ao.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 5721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295652026144.481, "dur": 14.546, "args": { "External id": 23131,"Record function id": 0, "Ev Idx": 5722 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336757, "tid": 1381170, "ts": 1295652026147.675, "dur": 10.484, "args": { "External id": 23132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1381170, "ts": 1295652026151.725, "dur": 5.657, "args": { "External id": 23133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5724 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1381170, "ts": 1295652026152.876, "dur": 4.407, "args": { "External id": 23134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5725 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::root_post_backward_callback", "pid": 1336757, "tid": 1381170, "ts": 1295652026179.521, "dur": 6750.975, "args": { "External id": 23135,"Record function id": 0, "Ev Idx": 5726 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate", "pid": 1336757, "tid": 1381170, "ts": 1295652026197.800, "dur": 53.898, "args": { "External id": 23136,"Record function id": 0, "Ev Idx": 5727 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard", "pid": 1336757, "tid": 1381170, "ts": 1295652026259.174, "dur": 240.958, "args": { "External id": 23137,"Record function id": 0, "Ev Idx": 5728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce", "pid": 1336757, "tid": 1381170, "ts": 1295652026506.828, "dur": 6161.447, "args": { "External id": 23138,"Record function id": 0, "Ev Idx": 5729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295652026631.325, "dur": 7.079, "args": { "External id": 23139,"Record function id": 0, "Concrete Inputs": ["[336611328]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1381170, "ts": 1295652026649.152, "dur": 5.275, "args": { "External id": 23140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[336611328], []], "Ev Idx": 5731 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295652026673.158, "dur": 4758.190, "args": { "External id": 23141,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [42076416, 1]], "Input Dims": [[], [], [], [8, 42076416]], "Ev Idx": 5732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336757, "tid": 1381170, "ts": 1295652026691.229, "dur": 4727.859, "args": { "External id": 23142,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [42076416, 1]], "Input Dims": [[], [], [], [8, 42076416]], "Ev Idx": 5733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295652027070.530, "dur": 24.077, "args": { "External id": 23143,"Record function id": 0, "Concrete Inputs": ["[82421]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1381170, "ts": 1295652027185.249, "dur": 4185.909, "args": { "External id": 23144,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[82421], [], [], [], [], [], [], []], "Ev Idx": 5735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1381170, "ts": 1295652027188.382, "dur": 4181.952, "args": { "External id": 23145,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[82421], [], [], [], [], [], []], "Ev Idx": 5736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652027192.352, "dur": 12.621, "args": { "External id": 23146,"Record function id": 0, "Concrete Inputs": ["[82421]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1381170, "ts": 1295652027206.991, "dur": 4157.958, "args": { "External id": 23147,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[82421], [82421], []], "Ev Idx": 5738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1381170, "ts": 1295652031557.621, "dur": 11.045, "args": { "External id": 23148,"Record function id": 0, "Concrete Inputs": ["", "[42076416]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[336611328], [], [], [], [], []], "Ev Idx": 5739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1381170, "ts": 1295652031560.989, "dur": 7.297, "args": { "External id": 23149,"Record function id": 0, "Concrete Inputs": ["[42076416]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5740 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336757, "tid": 1381170, "ts": 1295652031594.535, "dur": 448.933, "args": { "External id": 23150,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[42076416], [336611328], [], [], [], []], "Ev Idx": 5741 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295652031620.905, "dur": 417.126, "args": { "External id": 23151,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 42076416, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[336611328], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5742, "In msg nelems": 336611328 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336757, "tid": 1381170, "ts": 1295652031635.209, "dur": 396.992, "args": { "External id": 23152,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[336611328]], "Ev Idx": 5743 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1381170, "ts": 1295652032062.667, "dur": 2.826, "args": { "External id": 23153,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5744, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032123.056, "dur": 7.023, "args": { "External id": 23154,"Record function id": 0, "Concrete Inputs": ["", "[4000, 2048]", "[2048, 1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032174.625, "dur": 1.391, "args": { "External id": 23155,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8192000"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032190.988, "dur": 1.291, "args": { "External id": 23156,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "8192256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032205.339, "dur": 0.778, "args": { "External id": 23157,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "8716544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032218.376, "dur": 0.748, "args": { "External id": 23158,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "9240832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032244.571, "dur": 1.391, "args": { "External id": 23159,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "9765120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032261.193, "dur": 0.754, "args": { "External id": 23160,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "10289408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032272.985, "dur": 0.926, "args": { "External id": 23161,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "10289664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032283.612, "dur": 1.436, "args": { "External id": 23162,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "11731456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032297.285, "dur": 0.987, "args": { "External id": 23163,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "13173248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032308.307, "dur": 1.389, "args": { "External id": 23164,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "14615040"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032319.812, "dur": 0.829, "args": { "External id": 23165,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "14615296"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032331.230, "dur": 1.071, "args": { "External id": 23166,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "15139584"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032341.173, "dur": 0.953, "args": { "External id": 23167,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "15663872"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032353.139, "dur": 0.959, "args": { "External id": 23168,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "16188160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032363.827, "dur": 1.528, "args": { "External id": 23169,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "16712448"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032375.367, "dur": 1.181, "args": { "External id": 23170,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "16712704"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032385.855, "dur": 0.844, "args": { "External id": 23171,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "18154496"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032395.855, "dur": 1.632, "args": { "External id": 23172,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "19596288"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032405.982, "dur": 0.546, "args": { "External id": 23173,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "21038080"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032417.160, "dur": 1.087, "args": { "External id": 23174,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "21038336"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032427.031, "dur": 0.733, "args": { "External id": 23175,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "21562624"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032437.119, "dur": 1.438, "args": { "External id": 23176,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "22086912"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032447.786, "dur": 0.847, "args": { "External id": 23177,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "22611200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032458.789, "dur": 1.161, "args": { "External id": 23178,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "23135488"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032468.689, "dur": 0.774, "args": { "External id": 23179,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "23135744"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032479.347, "dur": 1.357, "args": { "External id": 23180,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "24577536"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032490.481, "dur": 1.134, "args": { "External id": 23181,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "26019328"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032501.496, "dur": 1.470, "args": { "External id": 23182,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27461120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032511.830, "dur": 0.689, "args": { "External id": 23183,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "27461376"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032521.441, "dur": 1.124, "args": { "External id": 23184,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "27985664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032533.010, "dur": 0.828, "args": { "External id": 23185,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "28509952"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032542.406, "dur": 1.323, "args": { "External id": 23186,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "29034240"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032553.133, "dur": 0.990, "args": { "External id": 23187,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "29558528"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032563.065, "dur": 1.451, "args": { "External id": 23188,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "29558784"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032573.371, "dur": 0.609, "args": { "External id": 23189,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "31000576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032585.248, "dur": 1.273, "args": { "External id": 23190,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "32442368"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032596.130, "dur": 0.821, "args": { "External id": 23191,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "33884160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1381170, "ts": 1295652032606.578, "dur": 1.256, "args": { "External id": 23192,"Record function id": 0, "Concrete Inputs": ["", "[4000, 2048]", "[2048, 1]", "33884416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5783 } }, { "ph": "X", "cat": "user_annotation", "name": "ProfilerStep#1023", "pid": 1336757, "tid": 1336757, "ts": 1295649887132.825, "dur": 2164384.674, "args": { "External id": 12289,"Record function id": 0, "Ev Idx": 5784 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.zero_grad#AdamW.zero_grad", "pid": 1336757, "tid": 1336757, "ts": 1295649887168.074, "dur": 581.650, "args": { "External id": 12290,"Record function id": 0, "Ev Idx": 5785 } }, { "ph": "X", "cat": "user_annotation", "name": "enumerate(DataLoader)#_StatefulMultiProcessingDataLoaderIter.__next__", "pid": 1336757, "tid": 1336757, "ts": 1295649887792.428, "dur": 2428.989, "args": { "External id": 12291,"Record function id": 0, "Ev Idx": 5786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649888825.294, "dur": 8.172, "args": { "External id": 12292,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336757, "tid": 1336757, "ts": 1295649888854.567, "dur": 6.840, "args": { "External id": 12293,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649889361.546, "dur": 3.171, "args": { "External id": 12294,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336757, "tid": 1336757, "ts": 1295649889373.234, "dur": 3.346, "args": { "External id": 12295,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649890078.950, "dur": 2.831, "args": { "External id": 12296,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336757, "tid": 1336757, "ts": 1295649890091.256, "dur": 2.794, "args": { "External id": 12297,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295649890635.257, "dur": 13.436, "args": { "External id": 12298,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 5793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649890642.597, "dur": 2.415, "args": { "External id": 12299,"Record function id": 0, "Concrete Inputs": ["", "[16, 8192]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 5794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295649890650.569, "dur": 4.728, "args": { "External id": 12300,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 5795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649890652.619, "dur": 1.500, "args": { "External id": 12301,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 5796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649890681.901, "dur": 589.435, "args": { "External id": 12302,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], [], []], "Ev Idx": 5797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649890688.992, "dur": 581.441, "args": { "External id": 12303,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 5798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649890696.769, "dur": 10.652, "args": { "External id": 12304,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649890710.032, "dur": 558.823, "args": { "External id": 12305,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649890720.195, "dur": 0.470, "args": { "External id": 12306,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 5801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 1336757, "tid": 1336757, "ts": 1295649890723.509, "dur": 9.794, "args": { "External id": 12307,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[8192, 1], [4096, 1]], "Input Dims": [[16, 4096], [16, 4096]], "Ev Idx": 5802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336757, "tid": 1336757, "ts": 1295649890728.971, "dur": 4.184, "args": { "External id": 12308,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], []], "Input Dims": [[16, 4096], [], []], "Ev Idx": 5803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649890732.230, "dur": 0.609, "args": { "External id": 12309,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295649890735.479, "dur": 242.491, "args": { "External id": 12310,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 5805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295649890737.776, "dur": 239.756, "args": { "External id": 12311,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 5806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295649890740.192, "dur": 69.768, "args": { "External id": 12312,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 5807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649890742.403, "dur": 66.951, "args": { "External id": 12313,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649890810.824, "dur": 166.046, "args": { "External id": 12314,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649890980.606, "dur": 282.569, "args": { "External id": 12315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649891296.246, "dur": 483.413, "args": { "External id": 12316,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 5811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649891299.174, "dur": 479.783, "args": { "External id": 12317,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], []], "Ev Idx": 5812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649891308.233, "dur": 11.319, "args": { "External id": 12318,"Record function id": 0, "Concrete Inputs": ["[16, 8192]", "[8192, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649891321.393, "dur": 454.658, "args": { "External id": 12319,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[8192, 1], [8192, 1], []], "Input Dims": [[16, 8192], [16, 8192], []], "Ev Idx": 5814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 1336757, "tid": 1336757, "ts": 1295649891805.164, "dur": 54.984, "args": { "External id": 12320,"Record function id": 0, "Concrete Inputs": ["0", "4096", "", "", "", "False"], "Input type": ["Scalar", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649891809.620, "dur": 4.691, "args": { "External id": 12321,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 1336757, "tid": 1336757, "ts": 1295649891817.560, "dur": 42.101, "args": { "External id": 12322,"Record function id": 0, "Concrete Inputs": ["0", "4096", "1", ""], "Input type": ["Scalar", "Scalar", "Scalar", "long int"], "Input Strides": [[], [], [], [1]], "Input Dims": [[], [], [], [0]], "Ev Idx": 5817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295649891822.932, "dur": 7.332, "args": { "External id": 12323,"Record function id": 0, "Concrete Inputs": ["", "[4096]", ""], "Input type": ["long int", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 5818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::repeat", "pid": 1336757, "tid": 1336757, "ts": 1295649891873.862, "dur": 72.698, "args": { "External id": 12324,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4096], []], "Ev Idx": 5819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336757, "tid": 1336757, "ts": 1295649891878.909, "dur": 7.806, "args": { "External id": 12325,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[4096], [], []], "Ev Idx": 5820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649891884.427, "dur": 1.989, "args": { "External id": 12326,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "[4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[4096], [], [], []], "Ev Idx": 5821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649891887.801, "dur": 3.574, "args": { "External id": 12327,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1336757, "ts": 1295649891893.760, "dur": 3.045, "args": { "External id": 12328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[4096, 1]], "Input Dims": [[16, 4096]], "Ev Idx": 5823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336757, "tid": 1336757, "ts": 1295649891901.884, "dur": 5.733, "args": { "External id": 12329,"Record function id": 0, "Concrete Inputs": ["", "0", "1", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649891906.843, "dur": 0.624, "args": { "External id": 12330,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1]", "[4096, 1, 4096]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336757, "tid": 1336757, "ts": 1295649891908.675, "dur": 4.172, "args": { "External id": 12331,"Record function id": 0, "Concrete Inputs": ["", "1", "4096", "4096"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 5826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649891911.860, "dur": 0.880, "args": { "External id": 12332,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[4096, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 5827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 1336757, "tid": 1336757, "ts": 1295649891914.867, "dur": 4.234, "args": { "External id": 12333,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[4096, 1], [4096, 4096, 4096, 1]], "Input Dims": [[1, 4096], [16, 1, 1, 4096]], "Ev Idx": 5828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336757, "tid": 1336757, "ts": 1295649891916.070, "dur": 2.924, "args": { "External id": 12334,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[4096, 1], [], []], "Input Dims": [[1, 4096], [], []], "Ev Idx": 5829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649891917.951, "dur": 0.929, "args": { "External id": 12335,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[0, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[1, 4096], [], [], []], "Ev Idx": 5830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649891920.341, "dur": 25.530, "args": { "External id": 12336,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 4096, 4096, 1], [0, 4096, 4096, 1], []], "Input Dims": [[16, 1, 1, 4096], [16, 1, 1, 4096], []], "Ev Idx": 5831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649891955.172, "dur": 69.789, "args": { "External id": 12337,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 5832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649891956.935, "dur": 67.832, "args": { "External id": 12338,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "", "", "", "False", ""], "Input type": ["long int", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 5833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649891963.795, "dur": 3.016, "args": { "External id": 12339,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "3", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649891967.836, "dur": 56.078, "args": { "External id": 12340,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5835 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::root_pre_forward", "pid": 1336757, "tid": 1336757, "ts": 1295649892140.820, "dur": 181.865, "args": { "External id": 12341,"Record function id": 0, "Ev Idx": 5836 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::inputs_to_device", "pid": 1336757, "tid": 1336757, "ts": 1295649892220.301, "dur": 87.439, "args": { "External id": 12342,"Record function id": 0, "Ev Idx": 5837 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295649892332.737, "dur": 52.326, "args": { "External id": 12343,"Record function id": 0, "Ev Idx": 5838 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward", "pid": 1336757, "tid": 1336757, "ts": 1295649892394.011, "dur": 9217.343, "args": { "External id": 12344,"Record function id": 0, "Ev Idx": 5839 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather", "pid": 1336757, "tid": 1336757, "ts": 1295649892404.727, "dur": 1326.081, "args": { "External id": 12345,"Record function id": 0, "Ev Idx": 5840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649892527.510, "dur": 8.813, "args": { "External id": 12346,"Record function id": 0, "Concrete Inputs": ["[42076416]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649892554.328, "dur": 121.067, "args": { "External id": 12347,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[42076416], [], []], "Ev Idx": 5842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892559.417, "dur": 2.213, "args": { "External id": 12348,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892567.705, "dur": 0.496, "args": { "External id": 12349,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8192000"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892569.367, "dur": 0.377, "args": { "External id": 12350,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "8192256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892570.753, "dur": 1.344, "args": { "External id": 12351,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "8716544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892576.788, "dur": 0.433, "args": { "External id": 12352,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "9240832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892578.072, "dur": 0.162, "args": { "External id": 12353,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "9765120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892578.935, "dur": 2.633, "args": { "External id": 12354,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "10289408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892584.135, "dur": 0.194, "args": { "External id": 12355,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "10289664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892584.894, "dur": 0.165, "args": { "External id": 12356,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11731456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892589.014, "dur": 0.367, "args": { "External id": 12357,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "13173248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892590.441, "dur": 0.282, "args": { "External id": 12358,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "14615040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892591.540, "dur": 1.497, "args": { "External id": 12359,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "14615296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892597.396, "dur": 0.181, "args": { "External id": 12360,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "15139584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892598.565, "dur": 0.322, "args": { "External id": 12361,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "15663872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892599.807, "dur": 2.137, "args": { "External id": 12362,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "16188160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892603.428, "dur": 0.413, "args": { "External id": 12363,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "16712448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892605.630, "dur": 0.384, "args": { "External id": 12364,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "16712704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892609.406, "dur": 0.320, "args": { "External id": 12365,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "18154496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892610.802, "dur": 0.324, "args": { "External id": 12366,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "19596288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892612.451, "dur": 1.823, "args": { "External id": 12367,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "21038080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892617.567, "dur": 0.338, "args": { "External id": 12368,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "21038336"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892618.967, "dur": 0.152, "args": { "External id": 12369,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "21562624"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892620.235, "dur": 2.410, "args": { "External id": 12370,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "22086912"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892623.660, "dur": 0.159, "args": { "External id": 12371,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "22611200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892625.156, "dur": 0.244, "args": { "External id": 12372,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "23135488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892628.955, "dur": 0.667, "args": { "External id": 12373,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "23135744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892630.735, "dur": 0.295, "args": { "External id": 12374,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "24577536"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892632.827, "dur": 1.442, "args": { "External id": 12375,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "26019328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892637.912, "dur": 0.294, "args": { "External id": 12376,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27461120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892639.255, "dur": 0.161, "args": { "External id": 12377,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27461376"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892641.263, "dur": 2.545, "args": { "External id": 12378,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27985664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892644.765, "dur": 0.157, "args": { "External id": 12379,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "28509952"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892645.927, "dur": 0.157, "args": { "External id": 12380,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "29034240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892649.390, "dur": 0.154, "args": { "External id": 12381,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "29558528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892650.496, "dur": 0.342, "args": { "External id": 12382,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29558784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892651.944, "dur": 1.568, "args": { "External id": 12383,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "31000576"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892656.611, "dur": 0.318, "args": { "External id": 12384,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "32442368"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892657.716, "dur": 0.182, "args": { "External id": 12385,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "33884160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892658.742, "dur": 2.467, "args": { "External id": 12386,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "33884416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649892698.716, "dur": 87.096, "args": { "External id": 12387,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 5882 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295649892861.561, "dur": 293.646, "args": { "External id": 12388,"Record function id": 0, "Concrete Inputs": ["", "", "42076416", "8", "4", "15", ""], "Input type": ["TensorList", "", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 5883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649892877.346, "dur": 5.266, "args": { "External id": 12389,"Record function id": 0, "Concrete Inputs": ["[336611328]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295649892889.803, "dur": 11.856, "args": { "External id": 12390,"Record function id": 0, "Concrete Inputs": ["", "0", "168305664", "42076416"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[336611328], [], [], []], "Ev Idx": 5885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295649892894.645, "dur": 6.584, "args": { "External id": 12391,"Record function id": 0, "Concrete Inputs": ["", "0", "168305664", "210382080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[336611328], [], [], [], []], "Ev Idx": 5886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892897.927, "dur": 0.618, "args": { "External id": 12392,"Record function id": 0, "Concrete Inputs": ["", "[42076416]", "[1]", "168305664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[336611328], [], [], []], "Ev Idx": 5887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649892909.444, "dur": 145.347, "args": { "External id": 12393,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[42076416], [], []], "Ev Idx": 5888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892911.676, "dur": 0.288, "args": { "External id": 12394,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "168305664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892913.671, "dur": 0.359, "args": { "External id": 12395,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "176497664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892915.166, "dur": 1.131, "args": { "External id": 12396,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "176497920"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892917.837, "dur": 0.665, "args": { "External id": 12397,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "177022208"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892919.583, "dur": 0.264, "args": { "External id": 12398,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "177546496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892921.222, "dur": 0.222, "args": { "External id": 12399,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "178070784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892923.452, "dur": 0.428, "args": { "External id": 12400,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "178595072"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892924.970, "dur": 0.194, "args": { "External id": 12401,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "178595328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892926.597, "dur": 0.758, "args": { "External id": 12402,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "180037120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892928.644, "dur": 0.186, "args": { "External id": 12403,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "181478912"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892929.860, "dur": 1.357, "args": { "External id": 12404,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "182920704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892932.786, "dur": 0.213, "args": { "External id": 12405,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "182920960"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892934.027, "dur": 2.556, "args": { "External id": 12406,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "183445248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892937.509, "dur": 0.336, "args": { "External id": 12407,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "183969536"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892939.421, "dur": 0.314, "args": { "External id": 12408,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "184493824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892943.510, "dur": 0.177, "args": { "External id": 12409,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "185018112"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892945.331, "dur": 0.471, "args": { "External id": 12410,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "185018368"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892947.176, "dur": 0.419, "args": { "External id": 12411,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "186460160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892951.333, "dur": 1.206, "args": { "External id": 12412,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "187901952"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892953.528, "dur": 0.313, "args": { "External id": 12413,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "189343744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892954.889, "dur": 2.492, "args": { "External id": 12414,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "189344000"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892958.383, "dur": 0.314, "args": { "External id": 12415,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "189868288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892959.893, "dur": 0.289, "args": { "External id": 12416,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "190392576"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892963.314, "dur": 0.148, "args": { "External id": 12417,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "190916864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892965.115, "dur": 0.306, "args": { "External id": 12418,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "191441152"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892966.814, "dur": 0.307, "args": { "External id": 12419,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "191441408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892970.764, "dur": 1.113, "args": { "External id": 12420,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "192883200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892973.272, "dur": 0.308, "args": { "External id": 12421,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "194324992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892975.254, "dur": 2.441, "args": { "External id": 12422,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "195766784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892979.001, "dur": 0.192, "args": { "External id": 12423,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "195767040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649892980.486, "dur": 0.327, "args": { "External id": 12424,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "196291328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893022.957, "dur": 0.890, "args": { "External id": 12425,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "196815616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893026.969, "dur": 0.164, "args": { "External id": 12426,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "197339904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893028.454, "dur": 0.463, "args": { "External id": 12427,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "197864192"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893032.457, "dur": 1.010, "args": { "External id": 12428,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "197864448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893034.787, "dur": 0.233, "args": { "External id": 12429,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "199306240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893036.307, "dur": 2.331, "args": { "External id": 12430,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "200748032"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893039.808, "dur": 0.258, "args": { "External id": 12431,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "202189824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649893041.222, "dur": 0.256, "args": { "External id": 12432,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "202190080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649893077.108, "dur": 61.382, "args": { "External id": 12433,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 5928 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295649893215.036, "dur": 400.754, "args": { "External id": 12434,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[336611328], [42076416], [], [], []], "Ev Idx": 5929 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649893273.413, "dur": 337.155, "args": { "External id": 12435,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 336611328, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[42076416], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5930, "In msg nelems": 42076416 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295649893287.162, "dur": 317.426, "args": { "External id": 12436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[42076416]], "Ev Idx": 5931 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649893645.020, "dur": 2.218, "args": { "External id": 12437,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5932, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out", "pid": 1336757, "tid": 1336757, "ts": 1295649893746.658, "dur": 7672.552, "args": { "External id": 12438,"Record function id": 0, "Ev Idx": 5933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893934.273, "dur": 6.942, "args": { "External id": 12439,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[336611328], []], "Ev Idx": 5934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893944.954, "dur": 1.543, "args": { "External id": 12440,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[65536000], []], "Ev Idx": 5935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893948.750, "dur": 1.039, "args": { "External id": 12441,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893951.789, "dur": 1.962, "args": { "External id": 12442,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893955.386, "dur": 0.920, "args": { "External id": 12443,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893961.857, "dur": 0.649, "args": { "External id": 12444,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893964.347, "dur": 0.652, "args": { "External id": 12445,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893966.768, "dur": 1.966, "args": { "External id": 12446,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893970.441, "dur": 1.140, "args": { "External id": 12447,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893974.943, "dur": 0.956, "args": { "External id": 12448,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893977.796, "dur": 0.456, "args": { "External id": 12449,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649893980.395, "dur": 1.620, "args": { "External id": 12450,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894023.560, "dur": 1.903, "args": { "External id": 12451,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894032.067, "dur": 1.040, "args": { "External id": 12452,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894035.205, "dur": 0.949, "args": { "External id": 12453,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894038.227, "dur": 1.400, "args": { "External id": 12454,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894041.320, "dur": 0.620, "args": { "External id": 12455,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894046.214, "dur": 0.891, "args": { "External id": 12456,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894048.953, "dur": 0.675, "args": { "External id": 12457,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894051.493, "dur": 1.417, "args": { "External id": 12458,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894054.625, "dur": 0.693, "args": { "External id": 12459,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894059.362, "dur": 0.550, "args": { "External id": 12460,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894061.950, "dur": 0.942, "args": { "External id": 12461,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894064.599, "dur": 1.802, "args": { "External id": 12462,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894075.611, "dur": 0.634, "args": { "External id": 12463,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894080.551, "dur": 0.671, "args": { "External id": 12464,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894082.876, "dur": 0.863, "args": { "External id": 12465,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894085.374, "dur": 1.746, "args": { "External id": 12466,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894088.578, "dur": 0.687, "args": { "External id": 12467,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894093.341, "dur": 0.833, "args": { "External id": 12468,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894095.596, "dur": 0.722, "args": { "External id": 12469,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894099.276, "dur": 1.588, "args": { "External id": 12470,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894102.398, "dur": 0.616, "args": { "External id": 12471,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894106.096, "dur": 0.717, "args": { "External id": 12472,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894108.266, "dur": 0.602, "args": { "External id": 12473,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894110.378, "dur": 1.663, "args": { "External id": 12474,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894113.714, "dur": 0.893, "args": { "External id": 12475,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894118.734, "dur": 0.864, "args": { "External id": 12476,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894121.351, "dur": 0.520, "args": { "External id": 12477,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649894123.893, "dur": 1.520, "args": { "External id": 12478,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[65536000], []], "Ev Idx": 5973 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649894153.538, "dur": 7203.648, "args": { "External id": 12479,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[42076416, 1], [], [], []], "Input Dims": [[8, 42076416], [], [], []], "Ev Idx": 5974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649894179.176, "dur": 7166.963, "args": { "External id": 12480,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[42076416, 1], [], [], []], "Input Dims": [[8, 42076416], [], [], []], "Ev Idx": 5975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649894204.933, "dur": 5.993, "args": { "External id": 12481,"Record function id": 0, "Concrete Inputs": ["[4290]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649894218.690, "dur": 7081.918, "args": { "External id": 12482,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[4290], [], [], [], [], [], [], []], "Ev Idx": 5977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649894221.183, "dur": 7078.630, "args": { "External id": 12483,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[4290], [], [], [], [], [], []], "Ev Idx": 5978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649894246.094, "dur": 7.805, "args": { "External id": 12484,"Record function id": 0, "Concrete Inputs": ["[4290]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649894256.829, "dur": 7039.196, "args": { "External id": 12485,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[4290], [4290], []], "Ev Idx": 5980 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295649901696.114, "dur": 44.516, "args": { "External id": 12486,"Record function id": 0, "Ev Idx": 5981 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 0/0", "pid": 1336757, "tid": 1336757, "ts": 1295649901741.690, "dur": 220.615, "args": { "External id": 12487,"Record function id": 0, "Ev Idx": 5982 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295649901784.415, "dur": 169.344, "args": { "External id": 12488,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "long int"], "Input Strides": [[2048, 1], [4096, 1]], "Input Dims": [[32000, 2048], [16, 4096]], "Ev Idx": 5983 } }, { "ph": "s", "id": 228, "pid": 1336757, "tid": 1336757, "ts": 1295649901784.415, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_0", "pid": 1336757, "tid": 1336757, "ts": 1295649901863.654, "dur": 54.182, "args": { "External id": 12489,"kernel_hash": "c5avyhm3orrzkqjkvrj7bppgyoz2vz6xunjvoc7l6ifi26al6auf", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/5a/c5avyhm3orrzkqjkvrj7bppgyoz2vz6xunjvoc7l6ifi26al6auf.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096], [32000, 2048], [16, 4096, 2048], []], "Ev Idx": 5984 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295649902072.873, "dur": 56.100, "args": { "External id": 12490,"Record function id": 0, "Ev Idx": 5985 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.0)", "pid": 1336757, "tid": 1336757, "ts": 1295649902140.286, "dur": 6977.870, "args": { "External id": 12491,"Record function id": 0, "Ev Idx": 5986 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 1336757, "tid": 1336757, "ts": 1295649902148.795, "dur": 822.553, "args": { "External id": 12492,"Record function id": 0, "Ev Idx": 5987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649902226.433, "dur": 32.671, "args": { "External id": 12493,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649902278.218, "dur": 52.468, "args": { "External id": 12494,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902288.336, "dur": 2.785, "args": { "External id": 12495,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902294.632, "dur": 0.362, "args": { "External id": 12496,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902297.283, "dur": 2.549, "args": { "External id": 12497,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902302.633, "dur": 0.477, "args": { "External id": 12498,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902305.182, "dur": 0.267, "args": { "External id": 12499,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902310.551, "dur": 0.322, "args": { "External id": 12500,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902313.338, "dur": 0.252, "args": { "External id": 12501,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902316.480, "dur": 1.365, "args": { "External id": 12502,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902322.605, "dur": 0.582, "args": { "External id": 12503,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649902345.070, "dur": 41.685, "args": { "External id": 12504,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5999 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295649902422.226, "dur": 117.766, "args": { "External id": 12505,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649902435.573, "dur": 4.636, "args": { "External id": 12506,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295649902445.638, "dur": 10.900, "args": { "External id": 12507,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295649902450.271, "dur": 5.851, "args": { "External id": 12508,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902454.147, "dur": 0.619, "args": { "External id": 12509,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649902464.124, "dur": 32.011, "args": { "External id": 12510,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902467.011, "dur": 0.737, "args": { "External id": 12511,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902469.591, "dur": 0.386, "args": { "External id": 12512,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902473.648, "dur": 0.462, "args": { "External id": 12513,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902475.793, "dur": 0.303, "args": { "External id": 12514,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902477.623, "dur": 3.683, "args": { "External id": 12515,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902483.339, "dur": 0.317, "args": { "External id": 12516,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902485.278, "dur": 0.512, "args": { "External id": 12517,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902489.601, "dur": 0.487, "args": { "External id": 12518,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649902491.628, "dur": 0.368, "args": { "External id": 12519,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649902507.821, "dur": 23.827, "args": { "External id": 12520,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6015 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295649902595.903, "dur": 289.630, "args": { "External id": 12521,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6016 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649902627.217, "dur": 253.663, "args": { "External id": 12522,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6017, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295649902637.935, "dur": 237.687, "args": { "External id": 12523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6018 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649902907.501, "dur": 2.396, "args": { "External id": 12524,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6019, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 1336757, "tid": 1336757, "ts": 1295649903034.107, "dur": 5792.940, "args": { "External id": 12525,"Record function id": 0, "Ev Idx": 6020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903135.796, "dur": 6.680, "args": { "External id": 12526,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903145.962, "dur": 0.961, "args": { "External id": 12527,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903148.896, "dur": 1.177, "args": { "External id": 12528,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903154.516, "dur": 2.057, "args": { "External id": 12529,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903157.877, "dur": 0.766, "args": { "External id": 12530,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903160.077, "dur": 0.776, "args": { "External id": 12531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903163.504, "dur": 0.827, "args": { "External id": 12532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903168.479, "dur": 1.630, "args": { "External id": 12533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903171.993, "dur": 1.178, "args": { "External id": 12534,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649903174.870, "dur": 0.677, "args": { "External id": 12535,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6030 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649903193.610, "dur": 5590.618, "args": { "External id": 12536,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649903209.695, "dur": 5567.646, "args": { "External id": 12537,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649903251.651, "dur": 17.166, "args": { "External id": 12538,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649903275.384, "dur": 5467.758, "args": { "External id": 12539,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649903278.442, "dur": 5464.094, "args": { "External id": 12540,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649903285.734, "dur": 8.773, "args": { "External id": 12541,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649903296.857, "dur": 5442.631, "args": { "External id": 12542,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6037 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295649908972.676, "dur": 117.920, "args": { "External id": 12543,"Sequence number": 246541, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6038 } }, { "ph": "s", "id": 227, "pid": 1336757, "tid": 1336757, "ts": 1295649908972.676, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295649909075.656, "dur": 9.720, "args": { "External id": 12544,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649909079.893, "dur": 5.124, "args": { "External id": 12545,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6040 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295649909159.993, "dur": 126.355, "args": { "External id": 12546,"Record function id": 0, "Ev Idx": 6041 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295649909290.900, "dur": 1205.150, "args": { "External id": 12547,"Record function id": 0, "Ev Idx": 6042 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295649909333.556, "dur": 1148.348, "args": { "External id": 12548,"Sequence number": 246542, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6043 } }, { "ph": "s", "id": 226, "pid": 1336757, "tid": 1336757, "ts": 1295649909333.556, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295649909407.709, "dur": 52.105, "args": { "External id": 12549,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649909473.824, "dur": 108.191, "args": { "External id": 12550,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649909591.559, "dur": 39.380, "args": { "External id": 12551,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649909639.436, "dur": 32.122, "args": { "External id": 12552,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6047 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295649909697.622, "dur": 26.899, "args": { "External id": 12553,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6048 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295649909743.272, "dur": 17.979, "args": { "External id": 12554,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6049 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295649909780.422, "dur": 133.942, "args": { "External id": 12555,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295649909835.250, "dur": 11.878, "args": { "External id": 12556,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649909840.564, "dur": 5.476, "args": { "External id": 12557,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649909850.384, "dur": 3.524, "args": { "External id": 12558,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649909855.329, "dur": 1.096, "args": { "External id": 12559,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649909859.482, "dur": 3.011, "args": { "External id": 12560,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649909925.400, "dur": 45.794, "args": { "External id": 12561,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6056 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295649910075.240, "dur": 33.626, "args": { "External id": 12562,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649910118.585, "dur": 47.705, "args": { "External id": 12563,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649910175.896, "dur": 35.772, "args": { "External id": 12564,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6059 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295649910272.289, "dur": 35.625, "args": { "External id": 12565,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649910315.787, "dur": 41.647, "args": { "External id": 12566,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6061 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295649910385.933, "dur": 19.642, "args": { "External id": 12567,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6062 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.0)", "pid": 1336757, "tid": 1336757, "ts": 1295649910564.257, "dur": 83.957, "args": { "External id": 12568,"Record function id": 0, "Ev Idx": 6063 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295649910721.987, "dur": 45.049, "args": { "External id": 12569,"Record function id": 0, "Ev Idx": 6064 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.1)", "pid": 1336757, "tid": 1336757, "ts": 1295649910776.167, "dur": 19240.252, "args": { "External id": 12570,"Record function id": 0, "Ev Idx": 6065 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 1336757, "tid": 1336757, "ts": 1295649910785.067, "dur": 1052.823, "args": { "External id": 12571,"Record function id": 0, "Ev Idx": 6066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649910863.423, "dur": 9.243, "args": { "External id": 12572,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649910887.159, "dur": 48.819, "args": { "External id": 12573,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910893.224, "dur": 4.255, "args": { "External id": 12574,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910900.026, "dur": 0.534, "args": { "External id": 12575,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910902.504, "dur": 0.757, "args": { "External id": 12576,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910907.647, "dur": 0.176, "args": { "External id": 12577,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910909.916, "dur": 1.533, "args": { "External id": 12578,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910917.867, "dur": 0.565, "args": { "External id": 12579,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910922.331, "dur": 0.387, "args": { "External id": 12580,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910924.451, "dur": 0.497, "args": { "External id": 12581,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649910927.490, "dur": 2.833, "args": { "External id": 12582,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649910948.712, "dur": 126.572, "args": { "External id": 12583,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6078 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295649911115.135, "dur": 178.021, "args": { "External id": 12584,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649911127.637, "dur": 6.013, "args": { "External id": 12585,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295649911139.156, "dur": 12.358, "args": { "External id": 12586,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295649911144.424, "dur": 6.700, "args": { "External id": 12587,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911148.360, "dur": 0.997, "args": { "External id": 12588,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649911159.284, "dur": 28.014, "args": { "External id": 12589,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911161.512, "dur": 0.765, "args": { "External id": 12590,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911163.538, "dur": 1.832, "args": { "External id": 12591,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911166.423, "dur": 2.988, "args": { "External id": 12592,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911170.641, "dur": 0.195, "args": { "External id": 12593,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911172.049, "dur": 0.478, "args": { "External id": 12594,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911176.414, "dur": 0.178, "args": { "External id": 12595,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911178.135, "dur": 0.371, "args": { "External id": 12596,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911179.665, "dur": 0.378, "args": { "External id": 12597,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649911183.424, "dur": 0.224, "args": { "External id": 12598,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649911202.330, "dur": 77.913, "args": { "External id": 12599,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6094 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295649911354.928, "dur": 389.850, "args": { "External id": 12600,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6095 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649911413.128, "dur": 327.105, "args": { "External id": 12601,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6096, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295649911423.844, "dur": 310.809, "args": { "External id": 12602,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6097 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649911770.054, "dur": 2.357, "args": { "External id": 12603,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6098, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 1336757, "tid": 1336757, "ts": 1295649911858.180, "dur": 17914.829, "args": { "External id": 12604,"Record function id": 0, "Ev Idx": 6099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911946.808, "dur": 6.300, "args": { "External id": 12605,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911956.628, "dur": 1.277, "args": { "External id": 12606,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911959.607, "dur": 1.127, "args": { "External id": 12607,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911962.449, "dur": 1.031, "args": { "External id": 12608,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911965.134, "dur": 0.845, "args": { "External id": 12609,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911969.698, "dur": 1.061, "args": { "External id": 12610,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911972.706, "dur": 0.794, "args": { "External id": 12611,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911975.239, "dur": 2.958, "args": { "External id": 12612,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649911980.122, "dur": 0.562, "args": { "External id": 12613,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649912047.226, "dur": 1.623, "args": { "External id": 12614,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6109 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649912069.268, "dur": 17654.490, "args": { "External id": 12615,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649912085.722, "dur": 17629.247, "args": { "External id": 12616,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649912109.706, "dur": 14.129, "args": { "External id": 12617,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649912126.967, "dur": 17550.332, "args": { "External id": 12618,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649912129.823, "dur": 17546.666, "args": { "External id": 12619,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649912136.097, "dur": 5.604, "args": { "External id": 12620,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649912144.094, "dur": 17528.450, "args": { "External id": 12621,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6116 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295649929921.000, "dur": 39.285, "args": { "External id": 12622,"Sequence number": 246543, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6117 } }, { "ph": "s", "id": 225, "pid": 1336757, "tid": 1336757, "ts": 1295649929921.000, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295649929945.991, "dur": 9.632, "args": { "External id": 12623,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649929950.060, "dur": 5.360, "args": { "External id": 12624,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6119 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295649930063.277, "dur": 84.686, "args": { "External id": 12625,"Record function id": 0, "Ev Idx": 6120 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295649930149.987, "dur": 1184.821, "args": { "External id": 12626,"Record function id": 0, "Ev Idx": 6121 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295649930193.349, "dur": 1123.323, "args": { "External id": 12627,"Sequence number": 246544, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6122 } }, { "ph": "s", "id": 224, "pid": 1336757, "tid": 1336757, "ts": 1295649930193.349, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295649930301.716, "dur": 58.552, "args": { "External id": 12628,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649930379.239, "dur": 114.482, "args": { "External id": 12629,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649930503.392, "dur": 38.512, "args": { "External id": 12630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649930547.071, "dur": 30.924, "args": { "External id": 12631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6126 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295649930609.782, "dur": 28.851, "args": { "External id": 12632,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6127 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295649930654.724, "dur": 19.702, "args": { "External id": 12633,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6128 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295649930692.235, "dur": 136.526, "args": { "External id": 12634,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295649930746.999, "dur": 13.120, "args": { "External id": 12635,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649930752.872, "dur": 6.369, "args": { "External id": 12636,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649930763.163, "dur": 4.847, "args": { "External id": 12637,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649930769.486, "dur": 3.263, "args": { "External id": 12638,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649930775.072, "dur": 3.374, "args": { "External id": 12639,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649930839.292, "dur": 44.246, "args": { "External id": 12640,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6135 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295649930913.965, "dur": 28.118, "args": { "External id": 12641,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649930950.340, "dur": 79.946, "args": { "External id": 12642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649931040.317, "dur": 39.522, "args": { "External id": 12643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6138 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295649931107.120, "dur": 27.007, "args": { "External id": 12644,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649931140.433, "dur": 33.782, "args": { "External id": 12645,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6140 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295649931192.995, "dur": 22.316, "args": { "External id": 12646,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6141 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.1)", "pid": 1336757, "tid": 1336757, "ts": 1295649931413.014, "dur": 84.252, "args": { "External id": 12647,"Record function id": 0, "Ev Idx": 6142 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295649931573.336, "dur": 46.513, "args": { "External id": 12648,"Record function id": 0, "Ev Idx": 6143 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.2)", "pid": 1336757, "tid": 1336757, "ts": 1295649931629.182, "dur": 18220.812, "args": { "External id": 12649,"Record function id": 0, "Ev Idx": 6144 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 1336757, "tid": 1336757, "ts": 1295649931637.662, "dur": 978.482, "args": { "External id": 12650,"Record function id": 0, "Ev Idx": 6145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649931720.670, "dur": 10.322, "args": { "External id": 12651,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649931744.190, "dur": 37.084, "args": { "External id": 12652,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931749.534, "dur": 2.515, "args": { "External id": 12653,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931757.010, "dur": 0.712, "args": { "External id": 12654,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931758.977, "dur": 0.477, "args": { "External id": 12655,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931760.922, "dur": 0.597, "args": { "External id": 12656,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931764.502, "dur": 0.650, "args": { "External id": 12657,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931766.248, "dur": 0.438, "args": { "External id": 12658,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931767.829, "dur": 4.043, "args": { "External id": 12659,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931773.567, "dur": 0.437, "args": { "External id": 12660,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931775.273, "dur": 0.529, "args": { "External id": 12661,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649931793.778, "dur": 45.016, "args": { "External id": 12662,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6157 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295649931870.489, "dur": 112.170, "args": { "External id": 12663,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649931884.028, "dur": 4.147, "args": { "External id": 12664,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295649931893.069, "dur": 11.174, "args": { "External id": 12665,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295649931898.262, "dur": 5.595, "args": { "External id": 12666,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931901.977, "dur": 0.664, "args": { "External id": 12667,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649931911.685, "dur": 29.361, "args": { "External id": 12668,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931913.448, "dur": 2.598, "args": { "External id": 12669,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931917.215, "dur": 0.424, "args": { "External id": 12670,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931918.770, "dur": 0.551, "args": { "External id": 12671,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931923.357, "dur": 1.466, "args": { "External id": 12672,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931926.095, "dur": 0.626, "args": { "External id": 12673,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931928.252, "dur": 0.482, "args": { "External id": 12674,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931931.841, "dur": 0.148, "args": { "External id": 12675,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931933.089, "dur": 0.369, "args": { "External id": 12676,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649931934.443, "dur": 2.705, "args": { "External id": 12677,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649931952.344, "dur": 22.145, "args": { "External id": 12678,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6173 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295649932081.388, "dur": 423.969, "args": { "External id": 12679,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6174 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649932113.569, "dur": 385.731, "args": { "External id": 12680,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6175, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295649932126.837, "dur": 364.707, "args": { "External id": 12681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6176 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649932535.759, "dur": 2.857, "args": { "External id": 12682,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6177, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 1336757, "tid": 1336757, "ts": 1295649932637.401, "dur": 17006.372, "args": { "External id": 12683,"Record function id": 0, "Ev Idx": 6178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932738.154, "dur": 6.573, "args": { "External id": 12684,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932748.257, "dur": 1.299, "args": { "External id": 12685,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932751.759, "dur": 2.850, "args": { "External id": 12686,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932756.377, "dur": 0.962, "args": { "External id": 12687,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932758.755, "dur": 1.080, "args": { "External id": 12688,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932761.246, "dur": 1.045, "args": { "External id": 12689,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932767.678, "dur": 0.960, "args": { "External id": 12690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932770.255, "dur": 1.868, "args": { "External id": 12691,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932773.809, "dur": 1.098, "args": { "External id": 12692,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649932776.552, "dur": 0.981, "args": { "External id": 12693,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6188 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649932798.543, "dur": 16796.028, "args": { "External id": 12694,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649932814.920, "dur": 16770.522, "args": { "External id": 12695,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649932836.448, "dur": 14.057, "args": { "External id": 12696,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649932853.545, "dur": 16694.426, "args": { "External id": 12697,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649932856.050, "dur": 16691.071, "args": { "External id": 12698,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649932862.519, "dur": 6.494, "args": { "External id": 12699,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649932870.804, "dur": 16672.339, "args": { "External id": 12700,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6195 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295649949785.553, "dur": 40.330, "args": { "External id": 12701,"Sequence number": 246545, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6196 } }, { "ph": "s", "id": 223, "pid": 1336757, "tid": 1336757, "ts": 1295649949785.553, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295649949810.906, "dur": 9.934, "args": { "External id": 12702,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649949815.245, "dur": 5.325, "args": { "External id": 12703,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6198 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295649949893.193, "dur": 79.140, "args": { "External id": 12704,"Record function id": 0, "Ev Idx": 6199 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295649949974.135, "dur": 1209.014, "args": { "External id": 12705,"Record function id": 0, "Ev Idx": 6200 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295649950069.827, "dur": 1098.652, "args": { "External id": 12706,"Sequence number": 246546, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6201 } }, { "ph": "s", "id": 222, "pid": 1336757, "tid": 1336757, "ts": 1295649950069.827, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295649950141.097, "dur": 49.096, "args": { "External id": 12707,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649950205.475, "dur": 128.126, "args": { "External id": 12708,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649950350.859, "dur": 53.465, "args": { "External id": 12709,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649950413.827, "dur": 32.438, "args": { "External id": 12710,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6205 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295649950478.704, "dur": 27.945, "args": { "External id": 12711,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6206 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295649950525.180, "dur": 16.615, "args": { "External id": 12712,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6207 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295649950563.352, "dur": 132.865, "args": { "External id": 12713,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295649950615.185, "dur": 12.005, "args": { "External id": 12714,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649950620.554, "dur": 5.729, "args": { "External id": 12715,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649950630.259, "dur": 4.769, "args": { "External id": 12716,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649950636.653, "dur": 1.043, "args": { "External id": 12717,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649950640.073, "dur": 4.361, "args": { "External id": 12718,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649950707.177, "dur": 46.846, "args": { "External id": 12719,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6214 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295649950785.283, "dur": 30.227, "args": { "External id": 12720,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649950824.561, "dur": 41.762, "args": { "External id": 12721,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649950875.226, "dur": 34.920, "args": { "External id": 12722,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6217 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295649950932.143, "dur": 27.153, "args": { "External id": 12723,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295649950965.539, "dur": 79.547, "args": { "External id": 12724,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6219 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295649951073.583, "dur": 23.226, "args": { "External id": 12725,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6220 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.2)", "pid": 1336757, "tid": 1336757, "ts": 1295649951277.945, "dur": 102.873, "args": { "External id": 12726,"Record function id": 0, "Ev Idx": 6221 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295649951462.541, "dur": 47.679, "args": { "External id": 12727,"Record function id": 0, "Ev Idx": 6222 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.3)", "pid": 1336757, "tid": 1336757, "ts": 1295649951519.595, "dur": 91929.047, "args": { "External id": 12728,"Record function id": 0, "Ev Idx": 6223 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 1336757, "tid": 1336757, "ts": 1295649951527.293, "dur": 1068.354, "args": { "External id": 12729,"Record function id": 0, "Ev Idx": 6224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649951610.407, "dur": 10.488, "args": { "External id": 12730,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649951635.224, "dur": 44.912, "args": { "External id": 12731,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951641.873, "dur": 2.456, "args": { "External id": 12732,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951649.186, "dur": 0.278, "args": { "External id": 12733,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951651.287, "dur": 0.499, "args": { "External id": 12734,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951657.887, "dur": 0.636, "args": { "External id": 12735,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951661.877, "dur": 0.802, "args": { "External id": 12736,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951664.102, "dur": 0.623, "args": { "External id": 12737,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951666.645, "dur": 3.976, "args": { "External id": 12738,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951671.948, "dur": 0.323, "args": { "External id": 12739,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951673.756, "dur": 0.193, "args": { "External id": 12740,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649951691.557, "dur": 43.843, "args": { "External id": 12741,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6236 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295649951769.273, "dur": 122.411, "args": { "External id": 12742,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649951780.999, "dur": 4.417, "args": { "External id": 12743,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295649951790.509, "dur": 11.280, "args": { "External id": 12744,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295649951795.601, "dur": 5.799, "args": { "External id": 12745,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951799.347, "dur": 0.691, "args": { "External id": 12746,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295649951808.812, "dur": 31.715, "args": { "External id": 12747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951811.390, "dur": 2.928, "args": { "External id": 12748,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951815.430, "dur": 0.516, "args": { "External id": 12749,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951817.806, "dur": 0.178, "args": { "External id": 12750,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951821.325, "dur": 1.321, "args": { "External id": 12751,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951824.580, "dur": 0.553, "args": { "External id": 12752,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951826.874, "dur": 0.147, "args": { "External id": 12753,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951830.766, "dur": 0.427, "args": { "External id": 12754,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951832.228, "dur": 0.198, "args": { "External id": 12755,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649951834.170, "dur": 2.144, "args": { "External id": 12756,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649951861.914, "dur": 21.743, "args": { "External id": 12757,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6252 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295649951946.572, "dur": 527.466, "args": { "External id": 12758,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6253 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649951978.052, "dur": 489.047, "args": { "External id": 12759,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6254, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295649952034.348, "dur": 425.672, "args": { "External id": 12760,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6255 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295649952506.181, "dur": 2.637, "args": { "External id": 12761,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6256, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 1336757, "tid": 1336757, "ts": 1295649952619.492, "dur": 90554.113, "args": { "External id": 12762,"Record function id": 0, "Ev Idx": 6257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952721.631, "dur": 7.202, "args": { "External id": 12763,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952732.594, "dur": 1.268, "args": { "External id": 12764,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952735.971, "dur": 2.111, "args": { "External id": 12765,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952739.770, "dur": 1.374, "args": { "External id": 12766,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952742.818, "dur": 0.784, "args": { "External id": 12767,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952745.304, "dur": 1.014, "args": { "External id": 12768,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952750.139, "dur": 0.922, "args": { "External id": 12769,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952753.062, "dur": 1.769, "args": { "External id": 12770,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952756.268, "dur": 0.920, "args": { "External id": 12771,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295649952759.048, "dur": 0.644, "args": { "External id": 12772,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6267 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649952780.937, "dur": 90333.128, "args": { "External id": 12773,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649952798.863, "dur": 90303.546, "args": { "External id": 12774,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295649952819.853, "dur": 15.449, "args": { "External id": 12775,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295649952838.343, "dur": 90220.395, "args": { "External id": 12776,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295649952841.010, "dur": 90216.588, "args": { "External id": 12777,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295649952848.408, "dur": 6.081, "args": { "External id": 12778,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295649952856.450, "dur": 90196.528, "args": { "External id": 12779,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6274 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650043364.980, "dur": 53.405, "args": { "External id": 12780,"Sequence number": 246547, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6275 } }, { "ph": "s", "id": 221, "pid": 1336757, "tid": 1336757, "ts": 1295650043364.980, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650043401.451, "dur": 11.661, "args": { "External id": 12781,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650043406.098, "dur": 6.650, "args": { "External id": 12782,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6277 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650043491.595, "dur": 83.257, "args": { "External id": 12783,"Record function id": 0, "Ev Idx": 6278 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650043577.024, "dur": 1249.879, "args": { "External id": 12784,"Record function id": 0, "Ev Idx": 6279 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650043620.089, "dur": 1191.070, "args": { "External id": 12785,"Sequence number": 246548, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6280 } }, { "ph": "s", "id": 220, "pid": 1336757, "tid": 1336757, "ts": 1295650043620.089, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650043690.045, "dur": 51.511, "args": { "External id": 12786,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650043754.150, "dur": 111.422, "args": { "External id": 12787,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650043881.925, "dur": 38.802, "args": { "External id": 12788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650043927.861, "dur": 34.518, "args": { "External id": 12789,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6284 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650044036.344, "dur": 36.564, "args": { "External id": 12790,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6285 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650044092.119, "dur": 17.070, "args": { "External id": 12791,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6286 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650044132.497, "dur": 175.841, "args": { "External id": 12792,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650044186.432, "dur": 12.944, "args": { "External id": 12793,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650044191.638, "dur": 6.903, "args": { "External id": 12794,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650044202.729, "dur": 5.382, "args": { "External id": 12795,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650044209.619, "dur": 1.336, "args": { "External id": 12796,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650044216.054, "dur": 4.803, "args": { "External id": 12797,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650044324.493, "dur": 74.602, "args": { "External id": 12798,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6293 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650044439.986, "dur": 34.979, "args": { "External id": 12799,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650044484.842, "dur": 43.173, "args": { "External id": 12800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650044563.771, "dur": 36.411, "args": { "External id": 12801,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6296 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650044629.256, "dur": 31.185, "args": { "External id": 12802,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650044665.910, "dur": 35.058, "args": { "External id": 12803,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6298 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650044720.145, "dur": 21.469, "args": { "External id": 12804,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6299 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.3)", "pid": 1336757, "tid": 1336757, "ts": 1295650044897.352, "dur": 77.944, "args": { "External id": 12805,"Record function id": 0, "Ev Idx": 6300 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650045115.969, "dur": 51.283, "args": { "External id": 12806,"Record function id": 0, "Ev Idx": 6301 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.4)", "pid": 1336757, "tid": 1336757, "ts": 1295650045177.442, "dur": 18101.609, "args": { "External id": 12807,"Record function id": 0, "Ev Idx": 6302 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 1336757, "tid": 1336757, "ts": 1295650045185.923, "dur": 982.222, "args": { "External id": 12808,"Record function id": 0, "Ev Idx": 6303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650045302.368, "dur": 12.287, "args": { "External id": 12809,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650045332.132, "dur": 48.526, "args": { "External id": 12810,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045339.248, "dur": 2.605, "args": { "External id": 12811,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045347.399, "dur": 0.420, "args": { "External id": 12812,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045350.090, "dur": 0.681, "args": { "External id": 12813,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045352.988, "dur": 0.593, "args": { "External id": 12814,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045358.009, "dur": 0.552, "args": { "External id": 12815,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045360.569, "dur": 0.443, "args": { "External id": 12816,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045363.285, "dur": 4.482, "args": { "External id": 12817,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045369.476, "dur": 0.869, "args": { "External id": 12818,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045372.699, "dur": 0.493, "args": { "External id": 12819,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650045395.855, "dur": 51.688, "args": { "External id": 12820,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6315 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650045484.172, "dur": 113.229, "args": { "External id": 12821,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650045496.320, "dur": 5.686, "args": { "External id": 12822,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650045507.054, "dur": 10.604, "args": { "External id": 12823,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650045511.986, "dur": 5.258, "args": { "External id": 12824,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045515.619, "dur": 0.383, "args": { "External id": 12825,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650045524.668, "dur": 31.279, "args": { "External id": 12826,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045527.138, "dur": 2.955, "args": { "External id": 12827,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045531.238, "dur": 0.586, "args": { "External id": 12828,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045533.695, "dur": 0.575, "args": { "External id": 12829,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045537.008, "dur": 1.874, "args": { "External id": 12830,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045540.391, "dur": 0.338, "args": { "External id": 12831,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045542.315, "dur": 0.320, "args": { "External id": 12832,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045545.865, "dur": 0.350, "args": { "External id": 12833,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045547.123, "dur": 0.185, "args": { "External id": 12834,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650045549.144, "dur": 2.896, "args": { "External id": 12835,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650045567.100, "dur": 22.401, "args": { "External id": 12836,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6331 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650045654.865, "dur": 410.746, "args": { "External id": 12837,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6332 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650045688.107, "dur": 371.595, "args": { "External id": 12838,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6333, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650045701.161, "dur": 352.009, "args": { "External id": 12839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6334 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650046093.142, "dur": 2.559, "args": { "External id": 12840,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6335, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 1336757, "tid": 1336757, "ts": 1295650046189.823, "dur": 16838.724, "args": { "External id": 12841,"Record function id": 0, "Ev Idx": 6336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046330.562, "dur": 7.707, "args": { "External id": 12842,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046343.155, "dur": 1.812, "args": { "External id": 12843,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046347.449, "dur": 2.483, "args": { "External id": 12844,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046352.921, "dur": 1.114, "args": { "External id": 12845,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046356.096, "dur": 1.310, "args": { "External id": 12846,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046359.618, "dur": 1.009, "args": { "External id": 12847,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046365.864, "dur": 1.183, "args": { "External id": 12848,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046369.693, "dur": 2.327, "args": { "External id": 12849,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046374.789, "dur": 1.160, "args": { "External id": 12850,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650046378.523, "dur": 1.308, "args": { "External id": 12851,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6346 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650046405.446, "dur": 16541.701, "args": { "External id": 12852,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650046423.187, "dur": 16511.104, "args": { "External id": 12853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650046448.460, "dur": 15.481, "args": { "External id": 12854,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650046467.346, "dur": 16429.864, "args": { "External id": 12855,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650046469.904, "dur": 16426.455, "args": { "External id": 12856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650046476.123, "dur": 6.138, "args": { "External id": 12857,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650046484.225, "dur": 16408.829, "args": { "External id": 12858,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6353 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650063182.017, "dur": 42.516, "args": { "External id": 12859,"Sequence number": 246549, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6354 } }, { "ph": "s", "id": 219, "pid": 1336757, "tid": 1336757, "ts": 1295650063182.017, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650063209.643, "dur": 10.156, "args": { "External id": 12860,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650063213.667, "dur": 5.896, "args": { "External id": 12861,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6356 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650063332.157, "dur": 91.040, "args": { "External id": 12862,"Record function id": 0, "Ev Idx": 6357 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650063425.540, "dur": 1208.670, "args": { "External id": 12863,"Record function id": 0, "Ev Idx": 6358 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650063469.701, "dur": 1149.868, "args": { "External id": 12864,"Sequence number": 246550, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6359 } }, { "ph": "s", "id": 218, "pid": 1336757, "tid": 1336757, "ts": 1295650063469.701, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650063543.193, "dur": 46.990, "args": { "External id": 12865,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650063604.050, "dur": 107.345, "args": { "External id": 12866,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650063721.677, "dur": 38.385, "args": { "External id": 12867,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650063769.199, "dur": 30.948, "args": { "External id": 12868,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6363 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650063825.568, "dur": 27.491, "args": { "External id": 12869,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6364 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650063870.948, "dur": 15.651, "args": { "External id": 12870,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6365 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650063905.133, "dur": 176.112, "args": { "External id": 12871,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650063954.483, "dur": 11.996, "args": { "External id": 12872,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650063959.477, "dur": 6.219, "args": { "External id": 12873,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650063969.318, "dur": 5.951, "args": { "External id": 12874,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650063976.566, "dur": 1.731, "args": { "External id": 12875,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650064019.610, "dur": 6.087, "args": { "External id": 12876,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650064093.794, "dur": 52.392, "args": { "External id": 12877,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6372 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650064180.472, "dur": 28.845, "args": { "External id": 12878,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650064219.266, "dur": 74.917, "args": { "External id": 12879,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650064309.029, "dur": 48.973, "args": { "External id": 12880,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6375 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650064400.009, "dur": 40.999, "args": { "External id": 12881,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650064448.989, "dur": 44.779, "args": { "External id": 12882,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6377 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650064516.558, "dur": 21.935, "args": { "External id": 12883,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6378 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.4)", "pid": 1336757, "tid": 1336757, "ts": 1295650064704.614, "dur": 82.352, "args": { "External id": 12884,"Record function id": 0, "Ev Idx": 6379 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650064860.655, "dur": 47.924, "args": { "External id": 12885,"Record function id": 0, "Ev Idx": 6380 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.5)", "pid": 1336757, "tid": 1336757, "ts": 1295650064917.519, "dur": 18008.444, "args": { "External id": 12886,"Record function id": 0, "Ev Idx": 6381 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 1336757, "tid": 1336757, "ts": 1295650064926.895, "dur": 913.182, "args": { "External id": 12887,"Record function id": 0, "Ev Idx": 6382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650065056.409, "dur": 10.997, "args": { "External id": 12888,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650065081.882, "dur": 42.095, "args": { "External id": 12889,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065087.479, "dur": 2.328, "args": { "External id": 12890,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065097.926, "dur": 0.500, "args": { "External id": 12891,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065099.488, "dur": 0.651, "args": { "External id": 12892,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065101.566, "dur": 0.552, "args": { "External id": 12893,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065105.389, "dur": 0.710, "args": { "External id": 12894,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065108.141, "dur": 0.378, "args": { "External id": 12895,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065109.745, "dur": 4.199, "args": { "External id": 12896,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065115.598, "dur": 0.481, "args": { "External id": 12897,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065117.282, "dur": 0.581, "args": { "External id": 12898,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650065137.013, "dur": 42.160, "args": { "External id": 12899,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6394 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650065212.841, "dur": 164.402, "args": { "External id": 12900,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650065223.830, "dur": 21.609, "args": { "External id": 12901,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650065254.005, "dur": 13.924, "args": { "External id": 12902,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650065259.583, "dur": 7.819, "args": { "External id": 12903,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065264.440, "dur": 0.913, "args": { "External id": 12904,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650065277.668, "dur": 41.017, "args": { "External id": 12905,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065280.653, "dur": 2.709, "args": { "External id": 12906,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065286.068, "dur": 0.520, "args": { "External id": 12907,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065288.178, "dur": 0.883, "args": { "External id": 12908,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065293.506, "dur": 2.470, "args": { "External id": 12909,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065297.878, "dur": 0.450, "args": { "External id": 12910,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065300.948, "dur": 0.459, "args": { "External id": 12911,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065305.618, "dur": 0.774, "args": { "External id": 12912,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065308.595, "dur": 0.599, "args": { "External id": 12913,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650065311.391, "dur": 2.567, "args": { "External id": 12914,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650065336.342, "dur": 30.462, "args": { "External id": 12915,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6410 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650065445.112, "dur": 297.467, "args": { "External id": 12916,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6411 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650065482.126, "dur": 255.074, "args": { "External id": 12917,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6412, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650065497.023, "dur": 232.999, "args": { "External id": 12918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6413 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650065768.214, "dur": 2.214, "args": { "External id": 12919,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6414, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 1336757, "tid": 1336757, "ts": 1295650065861.383, "dur": 16855.472, "args": { "External id": 12920,"Record function id": 0, "Ev Idx": 6415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650065964.500, "dur": 6.051, "args": { "External id": 12921,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650065974.023, "dur": 1.423, "args": { "External id": 12922,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650065977.401, "dur": 1.772, "args": { "External id": 12923,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650065981.111, "dur": 0.864, "args": { "External id": 12924,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650065983.606, "dur": 38.415, "args": { "External id": 12925,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650066026.340, "dur": 1.483, "args": { "External id": 12926,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650066032.346, "dur": 0.867, "args": { "External id": 12927,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650066034.793, "dur": 2.258, "args": { "External id": 12928,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650066038.734, "dur": 0.748, "args": { "External id": 12929,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650066040.849, "dur": 0.641, "args": { "External id": 12930,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6425 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650066063.379, "dur": 16598.474, "args": { "External id": 12931,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650066086.518, "dur": 16566.109, "args": { "External id": 12932,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650066107.562, "dur": 15.610, "args": { "External id": 12933,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650066126.221, "dur": 16487.799, "args": { "External id": 12934,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650066129.108, "dur": 16483.973, "args": { "External id": 12935,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650066135.599, "dur": 5.801, "args": { "External id": 12936,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650066143.421, "dur": 16465.194, "args": { "External id": 12937,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6432 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650082861.462, "dur": 38.980, "args": { "External id": 12938,"Sequence number": 246551, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6433 } }, { "ph": "s", "id": 217, "pid": 1336757, "tid": 1336757, "ts": 1295650082861.462, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650082885.647, "dur": 9.992, "args": { "External id": 12939,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650082889.962, "dur": 5.480, "args": { "External id": 12940,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6435 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650082967.949, "dur": 112.289, "args": { "External id": 12941,"Record function id": 0, "Ev Idx": 6436 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650083083.280, "dur": 1221.322, "args": { "External id": 12942,"Record function id": 0, "Ev Idx": 6437 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650083124.855, "dur": 1160.387, "args": { "External id": 12943,"Sequence number": 246552, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6438 } }, { "ph": "s", "id": 216, "pid": 1336757, "tid": 1336757, "ts": 1295650083124.855, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650083201.793, "dur": 69.963, "args": { "External id": 12944,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650083294.529, "dur": 115.458, "args": { "External id": 12945,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650083422.624, "dur": 40.090, "args": { "External id": 12946,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650083471.591, "dur": 30.659, "args": { "External id": 12947,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6442 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650083535.997, "dur": 32.531, "args": { "External id": 12948,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6443 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650083591.771, "dur": 15.846, "args": { "External id": 12949,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6444 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650083633.406, "dur": 143.640, "args": { "External id": 12950,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650083691.721, "dur": 12.139, "args": { "External id": 12951,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650083696.794, "dur": 6.062, "args": { "External id": 12952,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650083707.054, "dur": 5.739, "args": { "External id": 12953,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650083714.038, "dur": 1.332, "args": { "External id": 12954,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650083718.265, "dur": 4.985, "args": { "External id": 12955,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650083787.489, "dur": 48.774, "args": { "External id": 12956,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6451 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650083870.982, "dur": 32.224, "args": { "External id": 12957,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650083912.444, "dur": 41.621, "args": { "External id": 12958,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650083963.439, "dur": 76.181, "args": { "External id": 12959,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6454 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650084065.744, "dur": 27.440, "args": { "External id": 12960,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650084100.060, "dur": 39.009, "args": { "External id": 12961,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6456 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650084162.831, "dur": 22.397, "args": { "External id": 12962,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6457 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.5)", "pid": 1336757, "tid": 1336757, "ts": 1295650084383.076, "dur": 85.956, "args": { "External id": 12963,"Record function id": 0, "Ev Idx": 6458 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650084545.141, "dur": 47.466, "args": { "External id": 12964,"Record function id": 0, "Ev Idx": 6459 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.6)", "pid": 1336757, "tid": 1336757, "ts": 1295650084601.777, "dur": 17972.105, "args": { "External id": 12965,"Record function id": 0, "Ev Idx": 6460 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 1336757, "tid": 1336757, "ts": 1295650084610.581, "dur": 925.439, "args": { "External id": 12966,"Record function id": 0, "Ev Idx": 6461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650084694.776, "dur": 9.961, "args": { "External id": 12967,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650084717.877, "dur": 37.574, "args": { "External id": 12968,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084723.886, "dur": 2.484, "args": { "External id": 12969,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084731.339, "dur": 0.307, "args": { "External id": 12970,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084733.274, "dur": 0.328, "args": { "External id": 12971,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084735.207, "dur": 0.363, "args": { "External id": 12972,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084738.333, "dur": 0.614, "args": { "External id": 12973,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084740.748, "dur": 0.396, "args": { "External id": 12974,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084742.449, "dur": 3.271, "args": { "External id": 12975,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084747.324, "dur": 0.173, "args": { "External id": 12976,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084748.782, "dur": 0.139, "args": { "External id": 12977,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650084767.089, "dur": 44.432, "args": { "External id": 12978,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6473 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650084843.898, "dur": 110.039, "args": { "External id": 12979,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650084855.257, "dur": 4.399, "args": { "External id": 12980,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650084864.655, "dur": 10.833, "args": { "External id": 12981,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650084869.520, "dur": 5.558, "args": { "External id": 12982,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084873.405, "dur": 0.452, "args": { "External id": 12983,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650084882.056, "dur": 31.127, "args": { "External id": 12984,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084883.896, "dur": 2.621, "args": { "External id": 12985,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084887.845, "dur": 0.335, "args": { "External id": 12986,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084889.240, "dur": 0.277, "args": { "External id": 12987,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084893.918, "dur": 1.985, "args": { "External id": 12988,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084897.352, "dur": 0.430, "args": { "External id": 12989,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084899.663, "dur": 0.293, "args": { "External id": 12990,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084902.909, "dur": 0.317, "args": { "External id": 12991,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084904.862, "dur": 0.381, "args": { "External id": 12992,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650084906.705, "dur": 2.348, "args": { "External id": 12993,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650084924.544, "dur": 21.760, "args": { "External id": 12994,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6489 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650085053.471, "dur": 362.373, "args": { "External id": 12995,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6490 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650085089.035, "dur": 320.530, "args": { "External id": 12996,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6491, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650085101.609, "dur": 301.183, "args": { "External id": 12997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6492 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650085446.629, "dur": 6.574, "args": { "External id": 12998,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6493, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 1336757, "tid": 1336757, "ts": 1295650085557.444, "dur": 16807.850, "args": { "External id": 12999,"Record function id": 0, "Ev Idx": 6494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085660.471, "dur": 6.971, "args": { "External id": 13000,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085670.868, "dur": 1.548, "args": { "External id": 13001,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085674.196, "dur": 2.383, "args": { "External id": 13002,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085679.165, "dur": 1.188, "args": { "External id": 13003,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085681.612, "dur": 0.770, "args": { "External id": 13004,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085683.769, "dur": 0.799, "args": { "External id": 13005,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085688.160, "dur": 0.900, "args": { "External id": 13006,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085690.695, "dur": 2.224, "args": { "External id": 13007,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085694.393, "dur": 0.868, "args": { "External id": 13008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650085697.114, "dur": 0.632, "args": { "External id": 13009,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6504 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650085718.253, "dur": 16594.714, "args": { "External id": 13010,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650085734.060, "dur": 16568.991, "args": { "External id": 13011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650085757.210, "dur": 16.573, "args": { "External id": 13012,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650085777.002, "dur": 16481.835, "args": { "External id": 13013,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650085779.733, "dur": 16478.266, "args": { "External id": 13014,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650085786.955, "dur": 6.021, "args": { "External id": 13015,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650085794.763, "dur": 16459.622, "args": { "External id": 13016,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6511 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650102508.688, "dur": 39.580, "args": { "External id": 13017,"Sequence number": 246553, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6512 } }, { "ph": "s", "id": 215, "pid": 1336757, "tid": 1336757, "ts": 1295650102508.688, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650102532.739, "dur": 10.003, "args": { "External id": 13018,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650102537.337, "dur": 5.125, "args": { "External id": 13019,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6514 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650102612.348, "dur": 78.393, "args": { "External id": 13020,"Record function id": 0, "Ev Idx": 6515 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650102692.269, "dur": 1186.677, "args": { "External id": 13021,"Record function id": 0, "Ev Idx": 6516 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650102733.125, "dur": 1131.562, "args": { "External id": 13022,"Sequence number": 246554, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6517 } }, { "ph": "s", "id": 214, "pid": 1336757, "tid": 1336757, "ts": 1295650102733.125, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650102802.823, "dur": 44.995, "args": { "External id": 13023,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650102860.716, "dur": 105.323, "args": { "External id": 13024,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650102976.216, "dur": 81.064, "args": { "External id": 13025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650103071.049, "dur": 33.124, "args": { "External id": 13026,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6521 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650103132.468, "dur": 27.674, "args": { "External id": 13027,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6522 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650103178.387, "dur": 17.240, "args": { "External id": 13028,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6523 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650103216.345, "dur": 184.106, "args": { "External id": 13029,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650103292.305, "dur": 16.214, "args": { "External id": 13030,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650103299.038, "dur": 8.289, "args": { "External id": 13031,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650103312.052, "dur": 7.173, "args": { "External id": 13032,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650103321.827, "dur": 1.885, "args": { "External id": 13033,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650103326.871, "dur": 6.569, "args": { "External id": 13034,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650103413.305, "dur": 59.922, "args": { "External id": 13035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6530 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650103508.006, "dur": 35.039, "args": { "External id": 13036,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650103552.972, "dur": 41.638, "args": { "External id": 13037,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650103603.800, "dur": 34.557, "args": { "External id": 13038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6533 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650103662.880, "dur": 33.816, "args": { "External id": 13039,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650103702.404, "dur": 39.531, "args": { "External id": 13040,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6535 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650103763.069, "dur": 19.308, "args": { "External id": 13041,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6536 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.6)", "pid": 1336757, "tid": 1336757, "ts": 1295650103948.594, "dur": 123.623, "args": { "External id": 13042,"Record function id": 0, "Ev Idx": 6537 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650104152.503, "dur": 46.439, "args": { "External id": 13043,"Record function id": 0, "Ev Idx": 6538 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.7)", "pid": 1336757, "tid": 1336757, "ts": 1295650104208.494, "dur": 17942.450, "args": { "External id": 13044,"Record function id": 0, "Ev Idx": 6539 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 1336757, "tid": 1336757, "ts": 1295650104217.674, "dur": 946.844, "args": { "External id": 13045,"Record function id": 0, "Ev Idx": 6540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650104331.360, "dur": 12.209, "args": { "External id": 13046,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650104361.111, "dur": 41.780, "args": { "External id": 13047,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104368.091, "dur": 2.782, "args": { "External id": 13048,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104376.417, "dur": 0.307, "args": { "External id": 13049,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104378.445, "dur": 0.479, "args": { "External id": 13050,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104380.421, "dur": 0.504, "args": { "External id": 13051,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104384.325, "dur": 0.535, "args": { "External id": 13052,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104386.194, "dur": 0.468, "args": { "External id": 13053,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104388.167, "dur": 3.857, "args": { "External id": 13054,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104393.501, "dur": 0.174, "args": { "External id": 13055,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104395.363, "dur": 0.229, "args": { "External id": 13056,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650104413.876, "dur": 45.718, "args": { "External id": 13057,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6552 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650104496.934, "dur": 114.601, "args": { "External id": 13058,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650104508.538, "dur": 4.690, "args": { "External id": 13059,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650104518.289, "dur": 10.821, "args": { "External id": 13060,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650104523.316, "dur": 5.374, "args": { "External id": 13061,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104526.998, "dur": 0.426, "args": { "External id": 13062,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650104536.299, "dur": 31.461, "args": { "External id": 13063,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104538.176, "dur": 2.919, "args": { "External id": 13064,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104542.583, "dur": 0.333, "args": { "External id": 13065,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104544.403, "dur": 0.389, "args": { "External id": 13066,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104548.756, "dur": 1.375, "args": { "External id": 13067,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104551.436, "dur": 0.262, "args": { "External id": 13068,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104553.012, "dur": 0.247, "args": { "External id": 13069,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104556.887, "dur": 0.278, "args": { "External id": 13070,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104559.171, "dur": 0.156, "args": { "External id": 13071,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650104560.837, "dur": 2.575, "args": { "External id": 13072,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650104580.667, "dur": 22.417, "args": { "External id": 13073,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6568 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650104668.888, "dur": 391.772, "args": { "External id": 13074,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6569 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650104703.251, "dur": 351.663, "args": { "External id": 13075,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6570, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650104715.199, "dur": 333.523, "args": { "External id": 13076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6571 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650105088.214, "dur": 2.385, "args": { "External id": 13077,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6572, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 1336757, "tid": 1336757, "ts": 1295650105185.818, "dur": 16721.942, "args": { "External id": 13078,"Record function id": 0, "Ev Idx": 6573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105335.395, "dur": 7.809, "args": { "External id": 13079,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105348.221, "dur": 1.679, "args": { "External id": 13080,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105352.632, "dur": 2.852, "args": { "External id": 13081,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105360.554, "dur": 1.167, "args": { "External id": 13082,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105364.154, "dur": 1.058, "args": { "External id": 13083,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105367.379, "dur": 0.873, "args": { "External id": 13084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105370.942, "dur": 1.243, "args": { "External id": 13085,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105377.164, "dur": 2.455, "args": { "External id": 13086,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105381.840, "dur": 0.812, "args": { "External id": 13087,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650105384.943, "dur": 0.800, "args": { "External id": 13088,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6583 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650105413.466, "dur": 16442.801, "args": { "External id": 13089,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650105434.936, "dur": 16412.794, "args": { "External id": 13090,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650105456.869, "dur": 14.644, "args": { "External id": 13091,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650105476.661, "dur": 16333.177, "args": { "External id": 13092,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650105482.780, "dur": 16325.640, "args": { "External id": 13093,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650105489.509, "dur": 5.600, "args": { "External id": 13094,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650105496.836, "dur": 16308.167, "args": { "External id": 13095,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6590 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650122079.646, "dur": 43.262, "args": { "External id": 13096,"Sequence number": 246555, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6591 } }, { "ph": "s", "id": 213, "pid": 1336757, "tid": 1336757, "ts": 1295650122079.646, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650122107.636, "dur": 9.811, "args": { "External id": 13097,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650122111.619, "dur": 5.494, "args": { "External id": 13098,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6593 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650122191.263, "dur": 108.646, "args": { "External id": 13099,"Record function id": 0, "Ev Idx": 6594 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650122304.469, "dur": 1228.937, "args": { "External id": 13100,"Record function id": 0, "Ev Idx": 6595 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650122360.364, "dur": 1157.121, "args": { "External id": 13101,"Sequence number": 246556, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6596 } }, { "ph": "s", "id": 212, "pid": 1336757, "tid": 1336757, "ts": 1295650122360.364, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650122446.062, "dur": 49.796, "args": { "External id": 13102,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650122509.916, "dur": 104.805, "args": { "External id": 13103,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650122625.210, "dur": 39.414, "args": { "External id": 13104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650122674.295, "dur": 31.381, "args": { "External id": 13105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6600 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650122733.495, "dur": 27.644, "args": { "External id": 13106,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6601 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650122780.139, "dur": 16.853, "args": { "External id": 13107,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6602 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650122817.828, "dur": 140.510, "args": { "External id": 13108,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650122870.127, "dur": 12.265, "args": { "External id": 13109,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650122875.361, "dur": 5.942, "args": { "External id": 13110,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650122885.535, "dur": 6.546, "args": { "External id": 13111,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650122899.729, "dur": 1.186, "args": { "External id": 13112,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650122903.438, "dur": 4.189, "args": { "External id": 13113,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650122969.931, "dur": 92.999, "args": { "External id": 13114,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6609 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650123103.794, "dur": 29.591, "args": { "External id": 13115,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650123143.703, "dur": 44.935, "args": { "External id": 13116,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650123197.655, "dur": 54.780, "args": { "External id": 13117,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6612 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650123284.144, "dur": 38.185, "args": { "External id": 13118,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650123331.514, "dur": 56.182, "args": { "External id": 13119,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6614 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650123417.894, "dur": 22.408, "args": { "External id": 13120,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6615 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.7)", "pid": 1336757, "tid": 1336757, "ts": 1295650123603.222, "dur": 83.912, "args": { "External id": 13121,"Record function id": 0, "Ev Idx": 6616 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650123765.347, "dur": 48.524, "args": { "External id": 13122,"Record function id": 0, "Ev Idx": 6617 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.8)", "pid": 1336757, "tid": 1336757, "ts": 1295650123826.359, "dur": 17876.723, "args": { "External id": 13123,"Record function id": 0, "Ev Idx": 6618 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 1336757, "tid": 1336757, "ts": 1295650123834.933, "dur": 957.041, "args": { "External id": 13124,"Record function id": 0, "Ev Idx": 6619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650123919.002, "dur": 8.733, "args": { "External id": 13125,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650123940.479, "dur": 37.628, "args": { "External id": 13126,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123946.270, "dur": 2.274, "args": { "External id": 13127,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123953.196, "dur": 0.450, "args": { "External id": 13128,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123955.288, "dur": 0.275, "args": { "External id": 13129,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123956.659, "dur": 0.291, "args": { "External id": 13130,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123960.939, "dur": 0.541, "args": { "External id": 13131,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123962.505, "dur": 0.455, "args": { "External id": 13132,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123964.806, "dur": 3.799, "args": { "External id": 13133,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123969.730, "dur": 0.436, "args": { "External id": 13134,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650123971.779, "dur": 0.386, "args": { "External id": 13135,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650124032.397, "dur": 45.775, "args": { "External id": 13136,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6631 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650124113.631, "dur": 133.268, "args": { "External id": 13137,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650124126.272, "dur": 5.428, "args": { "External id": 13138,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650124137.089, "dur": 11.418, "args": { "External id": 13139,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650124141.882, "dur": 6.232, "args": { "External id": 13140,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124145.818, "dur": 0.670, "args": { "External id": 13141,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650124155.885, "dur": 30.020, "args": { "External id": 13142,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124158.078, "dur": 2.215, "args": { "External id": 13143,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124162.268, "dur": 0.400, "args": { "External id": 13144,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124164.222, "dur": 0.615, "args": { "External id": 13145,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124167.675, "dur": 1.272, "args": { "External id": 13146,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124170.587, "dur": 0.160, "args": { "External id": 13147,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124172.082, "dur": 0.476, "args": { "External id": 13148,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124176.352, "dur": 0.264, "args": { "External id": 13149,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124178.165, "dur": 0.489, "args": { "External id": 13150,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650124180.095, "dur": 2.201, "args": { "External id": 13151,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650124197.371, "dur": 21.740, "args": { "External id": 13152,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6647 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650124322.967, "dur": 372.388, "args": { "External id": 13153,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6648 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650124364.636, "dur": 325.680, "args": { "External id": 13154,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6649, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650124379.663, "dur": 305.364, "args": { "External id": 13155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6650 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650124719.578, "dur": 2.386, "args": { "External id": 13156,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6651, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 1336757, "tid": 1336757, "ts": 1295650124812.959, "dur": 16682.535, "args": { "External id": 13157,"Record function id": 0, "Ev Idx": 6652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124910.783, "dur": 6.704, "args": { "External id": 13158,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124920.977, "dur": 1.042, "args": { "External id": 13159,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124923.802, "dur": 1.963, "args": { "External id": 13160,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124927.891, "dur": 0.767, "args": { "External id": 13161,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124930.091, "dur": 0.834, "args": { "External id": 13162,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124932.165, "dur": 0.718, "args": { "External id": 13163,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124937.275, "dur": 0.789, "args": { "External id": 13164,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124939.957, "dur": 1.672, "args": { "External id": 13165,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124943.309, "dur": 0.740, "args": { "External id": 13166,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650124945.501, "dur": 0.717, "args": { "External id": 13167,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6662 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650124978.326, "dur": 16465.392, "args": { "External id": 13168,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650125036.873, "dur": 16398.399, "args": { "External id": 13169,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650125058.191, "dur": 15.412, "args": { "External id": 13170,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650125076.700, "dur": 16320.426, "args": { "External id": 13171,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650125079.296, "dur": 16317.016, "args": { "External id": 13172,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650125085.100, "dur": 8.884, "args": { "External id": 13173,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650125095.825, "dur": 16296.906, "args": { "External id": 13174,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6669 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650141638.615, "dur": 39.074, "args": { "External id": 13175,"Sequence number": 246557, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6670 } }, { "ph": "s", "id": 211, "pid": 1336757, "tid": 1336757, "ts": 1295650141638.615, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650141662.626, "dur": 10.020, "args": { "External id": 13176,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650141666.638, "dur": 5.755, "args": { "External id": 13177,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6672 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650141743.055, "dur": 80.612, "args": { "External id": 13178,"Record function id": 0, "Ev Idx": 6673 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650141825.268, "dur": 1150.849, "args": { "External id": 13179,"Record function id": 0, "Ev Idx": 6674 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650141866.407, "dur": 1095.679, "args": { "External id": 13180,"Sequence number": 246558, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6675 } }, { "ph": "s", "id": 210, "pid": 1336757, "tid": 1336757, "ts": 1295650141866.407, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650141934.704, "dur": 41.869, "args": { "External id": 13181,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650142028.458, "dur": 96.456, "args": { "External id": 13182,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650142136.351, "dur": 37.280, "args": { "External id": 13183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650142182.356, "dur": 31.067, "args": { "External id": 13184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6679 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650142263.989, "dur": 37.892, "args": { "External id": 13185,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6680 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650142327.320, "dur": 23.242, "args": { "External id": 13186,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6681 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650142376.905, "dur": 142.985, "args": { "External id": 13187,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650142432.177, "dur": 14.280, "args": { "External id": 13188,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650142437.713, "dur": 7.734, "args": { "External id": 13189,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650142449.466, "dur": 6.145, "args": { "External id": 13190,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650142457.133, "dur": 1.260, "args": { "External id": 13191,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650142460.985, "dur": 4.666, "args": { "External id": 13192,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650142532.224, "dur": 59.962, "args": { "External id": 13193,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6688 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650142626.264, "dur": 28.853, "args": { "External id": 13194,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650142664.578, "dur": 42.974, "args": { "External id": 13195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650142716.745, "dur": 35.164, "args": { "External id": 13196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6691 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650142775.159, "dur": 29.055, "args": { "External id": 13197,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650142809.536, "dur": 34.175, "args": { "External id": 13198,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6693 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650142864.277, "dur": 20.843, "args": { "External id": 13199,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6694 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.8)", "pid": 1336757, "tid": 1336757, "ts": 1295650143083.064, "dur": 78.630, "args": { "External id": 13200,"Record function id": 0, "Ev Idx": 6695 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650143257.391, "dur": 60.116, "args": { "External id": 13201,"Record function id": 0, "Ev Idx": 6696 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.9)", "pid": 1336757, "tid": 1336757, "ts": 1295650143330.354, "dur": 17956.222, "args": { "External id": 13202,"Record function id": 0, "Ev Idx": 6697 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 1336757, "tid": 1336757, "ts": 1295650143342.044, "dur": 1004.017, "args": { "External id": 13203,"Record function id": 0, "Ev Idx": 6698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650143434.006, "dur": 11.525, "args": { "External id": 13204,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650143459.128, "dur": 39.225, "args": { "External id": 13205,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143465.300, "dur": 2.653, "args": { "External id": 13206,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143473.136, "dur": 0.400, "args": { "External id": 13207,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143474.872, "dur": 0.338, "args": { "External id": 13208,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143476.676, "dur": 0.352, "args": { "External id": 13209,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143479.827, "dur": 0.360, "args": { "External id": 13210,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143481.889, "dur": 0.560, "args": { "External id": 13211,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143483.973, "dur": 3.752, "args": { "External id": 13212,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143489.840, "dur": 0.303, "args": { "External id": 13213,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143491.536, "dur": 0.556, "args": { "External id": 13214,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650143509.104, "dur": 45.498, "args": { "External id": 13215,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6710 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650143589.143, "dur": 123.625, "args": { "External id": 13216,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650143600.253, "dur": 4.506, "args": { "External id": 13217,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650143609.792, "dur": 10.800, "args": { "External id": 13218,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650143614.851, "dur": 5.312, "args": { "External id": 13219,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143618.508, "dur": 0.431, "args": { "External id": 13220,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650143627.245, "dur": 35.368, "args": { "External id": 13221,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143629.164, "dur": 2.774, "args": { "External id": 13222,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143638.143, "dur": 0.445, "args": { "External id": 13223,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143639.671, "dur": 0.186, "args": { "External id": 13224,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143643.365, "dur": 1.459, "args": { "External id": 13225,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143646.100, "dur": 0.564, "args": { "External id": 13226,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143648.373, "dur": 2.247, "args": { "External id": 13227,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143651.480, "dur": 0.430, "args": { "External id": 13228,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143653.754, "dur": 0.294, "args": { "External id": 13229,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650143657.876, "dur": 0.299, "args": { "External id": 13230,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650143682.518, "dur": 22.542, "args": { "External id": 13231,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6726 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650143767.119, "dur": 436.280, "args": { "External id": 13232,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6727 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650143798.151, "dur": 399.408, "args": { "External id": 13233,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6728, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650143814.930, "dur": 376.467, "args": { "External id": 13234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6729 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650144249.524, "dur": 4.188, "args": { "External id": 13235,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6730, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 1336757, "tid": 1336757, "ts": 1295650144373.939, "dur": 16677.296, "args": { "External id": 13236,"Record function id": 0, "Ev Idx": 6731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144492.242, "dur": 7.535, "args": { "External id": 13237,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144503.625, "dur": 0.926, "args": { "External id": 13238,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144506.508, "dur": 1.880, "args": { "External id": 13239,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144510.724, "dur": 0.824, "args": { "External id": 13240,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144513.097, "dur": 0.453, "args": { "External id": 13241,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144514.800, "dur": 0.872, "args": { "External id": 13242,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144520.042, "dur": 0.831, "args": { "External id": 13243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144522.539, "dur": 1.755, "args": { "External id": 13244,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144526.258, "dur": 0.687, "args": { "External id": 13245,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650144528.395, "dur": 1.059, "args": { "External id": 13246,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6741 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650144553.787, "dur": 16422.657, "args": { "External id": 13247,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650144570.886, "dur": 16396.774, "args": { "External id": 13248,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650144592.905, "dur": 14.490, "args": { "External id": 13249,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650144613.838, "dur": 16316.349, "args": { "External id": 13250,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650144616.291, "dur": 16313.098, "args": { "External id": 13251,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650144622.513, "dur": 5.623, "args": { "External id": 13252,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650144629.873, "dur": 16295.898, "args": { "External id": 13253,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6748 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650161196.982, "dur": 54.373, "args": { "External id": 13254,"Sequence number": 246559, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6749 } }, { "ph": "s", "id": 209, "pid": 1336757, "tid": 1336757, "ts": 1295650161196.982, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650161220.679, "dur": 23.903, "args": { "External id": 13255,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650161224.479, "dur": 19.243, "args": { "External id": 13256,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6751 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650161339.849, "dur": 90.255, "args": { "External id": 13257,"Record function id": 0, "Ev Idx": 6752 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650161432.074, "dur": 1188.103, "args": { "External id": 13258,"Record function id": 0, "Ev Idx": 6753 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650161477.994, "dur": 1126.736, "args": { "External id": 13259,"Sequence number": 246560, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6754 } }, { "ph": "s", "id": 208, "pid": 1336757, "tid": 1336757, "ts": 1295650161477.994, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650161553.354, "dur": 48.336, "args": { "External id": 13260,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650161615.011, "dur": 103.840, "args": { "External id": 13261,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650161728.212, "dur": 38.864, "args": { "External id": 13262,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650161775.962, "dur": 31.044, "args": { "External id": 13263,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6758 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650161832.660, "dur": 26.376, "args": { "External id": 13264,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6759 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650161877.154, "dur": 15.496, "args": { "External id": 13265,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6760 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650161912.107, "dur": 179.091, "args": { "External id": 13266,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650161963.287, "dur": 12.078, "args": { "External id": 13267,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650161968.458, "dur": 5.881, "args": { "External id": 13268,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650161978.804, "dur": 45.885, "args": { "External id": 13269,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650162027.396, "dur": 1.797, "args": { "External id": 13270,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650162032.527, "dur": 4.677, "args": { "External id": 13271,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650162103.554, "dur": 52.915, "args": { "External id": 13272,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6767 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650162189.932, "dur": 30.034, "args": { "External id": 13273,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650162254.901, "dur": 62.810, "args": { "External id": 13274,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650162332.020, "dur": 51.648, "args": { "External id": 13275,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6770 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650162415.411, "dur": 29.558, "args": { "External id": 13276,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650162452.256, "dur": 39.841, "args": { "External id": 13277,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6772 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650162513.527, "dur": 19.432, "args": { "External id": 13278,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6773 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.9)", "pid": 1336757, "tid": 1336757, "ts": 1295650162689.300, "dur": 80.866, "args": { "External id": 13279,"Record function id": 0, "Ev Idx": 6774 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650162844.408, "dur": 46.450, "args": { "External id": 13280,"Record function id": 0, "Ev Idx": 6775 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.10)", "pid": 1336757, "tid": 1336757, "ts": 1295650162899.898, "dur": 17817.465, "args": { "External id": 13281,"Record function id": 0, "Ev Idx": 6776 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 1336757, "tid": 1336757, "ts": 1295650162908.909, "dur": 991.692, "args": { "External id": 13282,"Record function id": 0, "Ev Idx": 6777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650163034.262, "dur": 10.501, "args": { "External id": 13283,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650163058.936, "dur": 38.815, "args": { "External id": 13284,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163064.778, "dur": 2.551, "args": { "External id": 13285,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163072.875, "dur": 0.440, "args": { "External id": 13286,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163074.831, "dur": 0.165, "args": { "External id": 13287,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163077.107, "dur": 0.337, "args": { "External id": 13288,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163080.811, "dur": 0.421, "args": { "External id": 13289,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163082.542, "dur": 0.282, "args": { "External id": 13290,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163084.240, "dur": 3.761, "args": { "External id": 13291,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163089.485, "dur": 0.443, "args": { "External id": 13292,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163091.300, "dur": 0.241, "args": { "External id": 13293,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650163110.324, "dur": 42.075, "args": { "External id": 13294,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6789 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650163186.826, "dur": 156.567, "args": { "External id": 13295,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650163197.941, "dur": 5.040, "args": { "External id": 13296,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650163208.441, "dur": 10.082, "args": { "External id": 13297,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650163212.774, "dur": 5.322, "args": { "External id": 13298,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163216.336, "dur": 0.544, "args": { "External id": 13299,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650163224.956, "dur": 57.823, "args": { "External id": 13300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163244.276, "dur": 3.165, "args": { "External id": 13301,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163250.567, "dur": 0.407, "args": { "External id": 13302,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163253.007, "dur": 0.520, "args": { "External id": 13303,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163258.249, "dur": 1.971, "args": { "External id": 13304,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163262.105, "dur": 0.286, "args": { "External id": 13305,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163264.671, "dur": 0.274, "args": { "External id": 13306,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163269.397, "dur": 0.716, "args": { "External id": 13307,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163272.307, "dur": 0.313, "args": { "External id": 13308,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650163274.435, "dur": 2.401, "args": { "External id": 13309,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650163299.875, "dur": 32.791, "args": { "External id": 13310,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6805 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650163408.809, "dur": 393.799, "args": { "External id": 13311,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6806 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650163441.963, "dur": 356.274, "args": { "External id": 13312,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6807, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650163486.794, "dur": 306.116, "args": { "External id": 13313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6808 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650163826.439, "dur": 2.106, "args": { "External id": 13314,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6809, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 1336757, "tid": 1336757, "ts": 1295650163921.681, "dur": 16585.179, "args": { "External id": 13315,"Record function id": 0, "Ev Idx": 6810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164062.779, "dur": 7.252, "args": { "External id": 13316,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164073.744, "dur": 1.246, "args": { "External id": 13317,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164076.829, "dur": 2.203, "args": { "External id": 13318,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164080.812, "dur": 1.073, "args": { "External id": 13319,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164083.204, "dur": 0.798, "args": { "External id": 13320,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164085.070, "dur": 0.718, "args": { "External id": 13321,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164090.072, "dur": 0.872, "args": { "External id": 13322,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164092.752, "dur": 1.902, "args": { "External id": 13323,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164095.940, "dur": 0.694, "args": { "External id": 13324,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650164098.263, "dur": 0.668, "args": { "External id": 13325,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6820 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650164120.791, "dur": 16336.015, "args": { "External id": 13326,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650164137.411, "dur": 16309.592, "args": { "External id": 13327,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650164158.656, "dur": 15.251, "args": { "External id": 13328,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650164177.026, "dur": 16232.052, "args": { "External id": 13329,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650164179.486, "dur": 16228.823, "args": { "External id": 13330,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650164185.893, "dur": 5.725, "args": { "External id": 13331,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650164193.587, "dur": 16210.989, "args": { "External id": 13332,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6827 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650180650.875, "dur": 40.904, "args": { "External id": 13333,"Sequence number": 246561, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6828 } }, { "ph": "s", "id": 207, "pid": 1336757, "tid": 1336757, "ts": 1295650180650.875, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650180677.083, "dur": 9.635, "args": { "External id": 13334,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650180681.406, "dur": 5.087, "args": { "External id": 13335,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6830 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650180757.601, "dur": 77.902, "args": { "External id": 13336,"Record function id": 0, "Ev Idx": 6831 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650180837.195, "dur": 1192.346, "args": { "External id": 13337,"Record function id": 0, "Ev Idx": 6832 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650180875.332, "dur": 1102.586, "args": { "External id": 13338,"Sequence number": 246562, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6833 } }, { "ph": "s", "id": 206, "pid": 1336757, "tid": 1336757, "ts": 1295650180875.332, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650180942.850, "dur": 78.993, "args": { "External id": 13339,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650181038.577, "dur": 95.346, "args": { "External id": 13340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650181145.133, "dur": 38.121, "args": { "External id": 13341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650181192.636, "dur": 31.177, "args": { "External id": 13342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6837 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650181277.774, "dur": 35.786, "args": { "External id": 13343,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6838 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650181340.521, "dur": 21.594, "args": { "External id": 13344,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6839 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650181388.056, "dur": 150.181, "args": { "External id": 13345,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650181449.736, "dur": 15.250, "args": { "External id": 13346,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650181456.938, "dur": 7.050, "args": { "External id": 13347,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650181468.101, "dur": 6.406, "args": { "External id": 13348,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650181475.873, "dur": 1.174, "args": { "External id": 13349,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650181479.111, "dur": 4.702, "args": { "External id": 13350,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650181550.637, "dur": 60.384, "args": { "External id": 13351,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6846 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650181643.473, "dur": 30.857, "args": { "External id": 13352,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650181683.870, "dur": 41.543, "args": { "External id": 13353,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650181734.304, "dur": 34.609, "args": { "External id": 13354,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6849 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650181793.976, "dur": 27.772, "args": { "External id": 13355,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650181827.428, "dur": 33.898, "args": { "External id": 13356,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6851 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650181882.183, "dur": 20.740, "args": { "External id": 13357,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6852 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.10)", "pid": 1336757, "tid": 1336757, "ts": 1295650182098.714, "dur": 79.182, "args": { "External id": 13358,"Record function id": 0, "Ev Idx": 6853 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650182281.388, "dur": 60.780, "args": { "External id": 13359,"Record function id": 0, "Ev Idx": 6854 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.11)", "pid": 1336757, "tid": 1336757, "ts": 1295650182354.560, "dur": 17777.880, "args": { "External id": 13360,"Record function id": 0, "Ev Idx": 6855 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 1336757, "tid": 1336757, "ts": 1295650182364.289, "dur": 986.413, "args": { "External id": 13361,"Record function id": 0, "Ev Idx": 6856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650182455.767, "dur": 11.644, "args": { "External id": 13362,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650182480.898, "dur": 39.944, "args": { "External id": 13363,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182487.270, "dur": 2.667, "args": { "External id": 13364,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182494.337, "dur": 0.320, "args": { "External id": 13365,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182496.604, "dur": 0.390, "args": { "External id": 13366,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182498.637, "dur": 0.369, "args": { "External id": 13367,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182502.450, "dur": 0.380, "args": { "External id": 13368,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182504.321, "dur": 0.529, "args": { "External id": 13369,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182506.733, "dur": 3.885, "args": { "External id": 13370,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182511.941, "dur": 0.379, "args": { "External id": 13371,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182514.096, "dur": 0.152, "args": { "External id": 13372,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650182536.444, "dur": 45.628, "args": { "External id": 13373,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6868 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650182615.609, "dur": 113.069, "args": { "External id": 13374,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650182626.937, "dur": 5.943, "args": { "External id": 13375,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650182637.942, "dur": 10.907, "args": { "External id": 13376,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650182642.982, "dur": 5.476, "args": { "External id": 13377,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182646.455, "dur": 0.643, "args": { "External id": 13378,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650182656.356, "dur": 27.469, "args": { "External id": 13379,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182658.552, "dur": 0.453, "args": { "External id": 13380,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182660.311, "dur": 2.485, "args": { "External id": 13381,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182664.430, "dur": 0.341, "args": { "External id": 13382,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182665.878, "dur": 1.579, "args": { "External id": 13383,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182671.476, "dur": 0.194, "args": { "External id": 13384,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182672.757, "dur": 0.549, "args": { "External id": 13385,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182674.908, "dur": 0.364, "args": { "External id": 13386,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182677.892, "dur": 0.472, "args": { "External id": 13387,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650182679.803, "dur": 0.370, "args": { "External id": 13388,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650182697.064, "dur": 23.115, "args": { "External id": 13389,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6884 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650182783.081, "dur": 424.441, "args": { "External id": 13390,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6885 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650182814.049, "dur": 388.057, "args": { "External id": 13391,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6886, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650182825.631, "dur": 370.129, "args": { "External id": 13392,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6887 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650183256.128, "dur": 4.466, "args": { "External id": 13393,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6888, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 1336757, "tid": 1336757, "ts": 1295650183378.688, "dur": 16509.476, "args": { "External id": 13394,"Record function id": 0, "Ev Idx": 6889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183494.367, "dur": 7.397, "args": { "External id": 13395,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183505.472, "dur": 1.465, "args": { "External id": 13396,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183508.894, "dur": 2.344, "args": { "External id": 13397,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183513.022, "dur": 0.816, "args": { "External id": 13398,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183515.038, "dur": 0.721, "args": { "External id": 13399,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183516.953, "dur": 0.913, "args": { "External id": 13400,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183521.579, "dur": 1.184, "args": { "External id": 13401,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183524.465, "dur": 1.826, "args": { "External id": 13402,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183527.693, "dur": 0.846, "args": { "External id": 13403,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650183530.490, "dur": 1.129, "args": { "External id": 13404,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6899 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650183553.621, "dur": 16284.749, "args": { "External id": 13405,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650183569.786, "dur": 16259.765, "args": { "External id": 13406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650183592.793, "dur": 14.048, "args": { "External id": 13407,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650183610.297, "dur": 16181.729, "args": { "External id": 13408,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650183612.621, "dur": 16178.522, "args": { "External id": 13409,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650183618.913, "dur": 5.284, "args": { "External id": 13410,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650183626.168, "dur": 16160.672, "args": { "External id": 13411,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6906 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650200061.766, "dur": 43.498, "args": { "External id": 13412,"Sequence number": 246563, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6907 } }, { "ph": "s", "id": 205, "pid": 1336757, "tid": 1336757, "ts": 1295650200061.766, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650200089.749, "dur": 10.110, "args": { "External id": 13413,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650200093.760, "dur": 5.716, "args": { "External id": 13414,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6909 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650200174.073, "dur": 102.414, "args": { "External id": 13415,"Record function id": 0, "Ev Idx": 6910 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650200280.813, "dur": 1189.331, "args": { "External id": 13416,"Record function id": 0, "Ev Idx": 6911 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650200334.798, "dur": 1120.103, "args": { "External id": 13417,"Sequence number": 246564, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6912 } }, { "ph": "s", "id": 204, "pid": 1336757, "tid": 1336757, "ts": 1295650200334.798, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650200413.755, "dur": 49.611, "args": { "External id": 13418,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650200477.020, "dur": 106.434, "args": { "External id": 13419,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650200594.355, "dur": 38.202, "args": { "External id": 13420,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650200641.797, "dur": 31.150, "args": { "External id": 13421,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6916 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650200699.171, "dur": 26.658, "args": { "External id": 13422,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6917 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650200744.186, "dur": 14.979, "args": { "External id": 13423,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6918 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650200779.563, "dur": 137.339, "args": { "External id": 13424,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650200833.857, "dur": 12.182, "args": { "External id": 13425,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650200839.029, "dur": 5.965, "args": { "External id": 13426,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650200848.986, "dur": 6.936, "args": { "External id": 13427,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650200857.536, "dur": 1.429, "args": { "External id": 13428,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650200861.221, "dur": 4.780, "args": { "External id": 13429,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650200927.981, "dur": 43.752, "args": { "External id": 13430,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6925 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650201046.759, "dur": 33.045, "args": { "External id": 13431,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650201090.191, "dur": 46.004, "args": { "External id": 13432,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650201145.370, "dur": 35.732, "args": { "External id": 13433,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6928 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650201204.262, "dur": 44.774, "args": { "External id": 13434,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650201259.292, "dur": 50.556, "args": { "External id": 13435,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6930 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650201337.752, "dur": 30.092, "args": { "External id": 13436,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6931 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.11)", "pid": 1336757, "tid": 1336757, "ts": 1295650201542.163, "dur": 80.448, "args": { "External id": 13437,"Record function id": 0, "Ev Idx": 6932 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650201698.641, "dur": 47.962, "args": { "External id": 13438,"Record function id": 0, "Ev Idx": 6933 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.12)", "pid": 1336757, "tid": 1336757, "ts": 1295650201755.052, "dur": 17916.891, "args": { "External id": 13439,"Record function id": 0, "Ev Idx": 6934 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 1336757, "tid": 1336757, "ts": 1295650201763.335, "dur": 944.334, "args": { "External id": 13440,"Record function id": 0, "Ev Idx": 6935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650201846.829, "dur": 9.918, "args": { "External id": 13441,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650201872.229, "dur": 37.832, "args": { "External id": 13442,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201878.523, "dur": 2.566, "args": { "External id": 13443,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201885.448, "dur": 0.687, "args": { "External id": 13444,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201887.838, "dur": 0.180, "args": { "External id": 13445,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201889.184, "dur": 2.690, "args": { "External id": 13446,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201894.021, "dur": 0.324, "args": { "External id": 13447,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201895.227, "dur": 0.387, "args": { "External id": 13448,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201899.725, "dur": 1.363, "args": { "External id": 13449,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201902.135, "dur": 0.161, "args": { "External id": 13450,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650201903.687, "dur": 0.204, "args": { "External id": 13451,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650201922.083, "dur": 39.474, "args": { "External id": 13452,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6947 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650202035.976, "dur": 119.937, "args": { "External id": 13453,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650202048.045, "dur": 6.639, "args": { "External id": 13454,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650202060.450, "dur": 13.557, "args": { "External id": 13455,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650202065.138, "dur": 8.452, "args": { "External id": 13456,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202068.754, "dur": 3.163, "args": { "External id": 13457,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650202081.204, "dur": 28.125, "args": { "External id": 13458,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202083.452, "dur": 0.644, "args": { "External id": 13459,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202085.713, "dur": 0.491, "args": { "External id": 13460,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202087.739, "dur": 0.253, "args": { "External id": 13461,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202091.188, "dur": 2.179, "args": { "External id": 13462,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202095.025, "dur": 0.524, "args": { "External id": 13463,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202096.894, "dur": 1.278, "args": { "External id": 13464,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202099.819, "dur": 0.210, "args": { "External id": 13465,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202101.049, "dur": 0.799, "args": { "External id": 13466,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202105.413, "dur": 0.237, "args": { "External id": 13467,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650202121.546, "dur": 26.396, "args": { "External id": 13468,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6963 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650202211.283, "dur": 392.264, "args": { "External id": 13469,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6964 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650202264.051, "dur": 332.910, "args": { "External id": 13470,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6965, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650202279.047, "dur": 312.203, "args": { "External id": 13471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6966 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650202630.019, "dur": 2.977, "args": { "External id": 13472,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6967, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 1336757, "tid": 1336757, "ts": 1295650202729.797, "dur": 16733.333, "args": { "External id": 13473,"Record function id": 0, "Ev Idx": 6968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202831.001, "dur": 6.500, "args": { "External id": 13474,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202840.915, "dur": 1.239, "args": { "External id": 13475,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202844.085, "dur": 2.724, "args": { "External id": 13476,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202848.714, "dur": 0.780, "args": { "External id": 13477,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202851.004, "dur": 0.649, "args": { "External id": 13478,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202852.866, "dur": 0.790, "args": { "External id": 13479,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202858.237, "dur": 0.783, "args": { "External id": 13480,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202860.666, "dur": 1.765, "args": { "External id": 13481,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202864.432, "dur": 0.870, "args": { "External id": 13482,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650202866.447, "dur": 0.611, "args": { "External id": 13483,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6978 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650202887.304, "dur": 16524.539, "args": { "External id": 13484,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650202903.919, "dur": 16499.410, "args": { "External id": 13485,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650202926.526, "dur": 14.510, "args": { "External id": 13486,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650202943.915, "dur": 16421.415, "args": { "External id": 13487,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650202946.649, "dur": 16417.789, "args": { "External id": 13488,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650202952.766, "dur": 5.332, "args": { "External id": 13489,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650202960.111, "dur": 16400.369, "args": { "External id": 13490,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6985 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650219606.705, "dur": 39.666, "args": { "External id": 13491,"Sequence number": 246565, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6986 } }, { "ph": "s", "id": 203, "pid": 1336757, "tid": 1336757, "ts": 1295650219606.705, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650219631.060, "dur": 10.329, "args": { "External id": 13492,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650219635.287, "dur": 5.814, "args": { "External id": 13493,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6988 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650219712.025, "dur": 76.012, "args": { "External id": 13494,"Record function id": 0, "Ev Idx": 6989 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650219789.766, "dur": 1151.235, "args": { "External id": 13495,"Record function id": 0, "Ev Idx": 6990 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650219829.997, "dur": 1097.256, "args": { "External id": 13496,"Sequence number": 246566, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6991 } }, { "ph": "s", "id": 202, "pid": 1336757, "tid": 1336757, "ts": 1295650219829.997, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650219897.778, "dur": 41.399, "args": { "External id": 13497,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650219951.832, "dur": 134.014, "args": { "External id": 13498,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650220101.325, "dur": 40.583, "args": { "External id": 13499,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650220151.807, "dur": 31.783, "args": { "External id": 13500,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6995 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650220211.565, "dur": 49.986, "args": { "External id": 13501,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6996 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650220289.776, "dur": 24.785, "args": { "External id": 13502,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6997 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650220339.874, "dur": 149.144, "args": { "External id": 13503,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650220401.595, "dur": 13.218, "args": { "External id": 13504,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650220406.901, "dur": 7.027, "args": { "External id": 13505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650220417.701, "dur": 6.673, "args": { "External id": 13506,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650220425.641, "dur": 1.163, "args": { "External id": 13507,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650220429.380, "dur": 4.966, "args": { "External id": 13508,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650220501.106, "dur": 57.081, "args": { "External id": 13509,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7004 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650220591.033, "dur": 28.834, "args": { "External id": 13510,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650220629.040, "dur": 43.017, "args": { "External id": 13511,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650220680.824, "dur": 35.249, "args": { "External id": 13512,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7007 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650220747.933, "dur": 29.148, "args": { "External id": 13513,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650220784.657, "dur": 36.327, "args": { "External id": 13514,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7009 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650220839.343, "dur": 20.513, "args": { "External id": 13515,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7010 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.12)", "pid": 1336757, "tid": 1336757, "ts": 1295650221044.304, "dur": 78.990, "args": { "External id": 13516,"Record function id": 0, "Ev Idx": 7011 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650221201.791, "dur": 71.207, "args": { "External id": 13517,"Record function id": 0, "Ev Idx": 7012 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.13)", "pid": 1336757, "tid": 1336757, "ts": 1295650221286.595, "dur": 18093.247, "args": { "External id": 13518,"Record function id": 0, "Ev Idx": 7013 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 1336757, "tid": 1336757, "ts": 1295650221298.255, "dur": 916.680, "args": { "External id": 13519,"Record function id": 0, "Ev Idx": 7014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650221397.639, "dur": 12.566, "args": { "External id": 13520,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650221426.145, "dur": 37.139, "args": { "External id": 13521,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221431.718, "dur": 2.780, "args": { "External id": 13522,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221439.354, "dur": 0.522, "args": { "External id": 13523,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221441.289, "dur": 0.440, "args": { "External id": 13524,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221443.436, "dur": 0.292, "args": { "External id": 13525,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221446.323, "dur": 0.245, "args": { "External id": 13526,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221447.882, "dur": 0.481, "args": { "External id": 13527,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221449.359, "dur": 4.397, "args": { "External id": 13528,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221455.781, "dur": 0.468, "args": { "External id": 13529,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221457.055, "dur": 0.225, "args": { "External id": 13530,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650221474.974, "dur": 46.122, "args": { "External id": 13531,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7026 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650221554.862, "dur": 111.556, "args": { "External id": 13532,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650221566.131, "dur": 4.182, "args": { "External id": 13533,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650221575.537, "dur": 10.622, "args": { "External id": 13534,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650221580.241, "dur": 5.535, "args": { "External id": 13535,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221583.861, "dur": 0.719, "args": { "External id": 13536,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650221592.728, "dur": 30.885, "args": { "External id": 13537,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221594.899, "dur": 2.554, "args": { "External id": 13538,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221599.403, "dur": 0.405, "args": { "External id": 13539,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221600.872, "dur": 0.405, "args": { "External id": 13540,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221605.043, "dur": 1.397, "args": { "External id": 13541,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221607.907, "dur": 0.313, "args": { "External id": 13542,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221609.837, "dur": 0.487, "args": { "External id": 13543,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221613.326, "dur": 0.516, "args": { "External id": 13544,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221615.626, "dur": 0.178, "args": { "External id": 13545,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650221617.328, "dur": 2.609, "args": { "External id": 13546,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650221636.565, "dur": 21.769, "args": { "External id": 13547,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7042 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650221721.512, "dur": 390.632, "args": { "External id": 13548,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7043 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650221755.141, "dur": 351.332, "args": { "External id": 13549,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7044, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650221765.550, "dur": 333.669, "args": { "External id": 13550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7045 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650222139.922, "dur": 3.084, "args": { "External id": 13551,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7046, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 1336757, "tid": 1336757, "ts": 1295650222258.355, "dur": 16878.495, "args": { "External id": 13552,"Record function id": 0, "Ev Idx": 7047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222388.072, "dur": 8.302, "args": { "External id": 13553,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222400.561, "dur": 1.361, "args": { "External id": 13554,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222403.699, "dur": 2.966, "args": { "External id": 13555,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222408.960, "dur": 1.104, "args": { "External id": 13556,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222411.361, "dur": 0.759, "args": { "External id": 13557,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222415.409, "dur": 0.721, "args": { "External id": 13558,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222417.831, "dur": 0.454, "args": { "External id": 13559,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222419.871, "dur": 1.807, "args": { "External id": 13560,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222423.070, "dur": 0.652, "args": { "External id": 13561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650222427.420, "dur": 0.555, "args": { "External id": 13562,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7057 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650222447.622, "dur": 16638.857, "args": { "External id": 13563,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650222464.063, "dur": 16613.763, "args": { "External id": 13564,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650222488.392, "dur": 15.696, "args": { "External id": 13565,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650222507.010, "dur": 16532.818, "args": { "External id": 13566,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650222510.000, "dur": 16528.954, "args": { "External id": 13567,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650222516.481, "dur": 5.762, "args": { "External id": 13568,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650222523.824, "dur": 16511.518, "args": { "External id": 13569,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7064 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650239304.765, "dur": 43.701, "args": { "External id": 13570,"Sequence number": 246567, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7065 } }, { "ph": "s", "id": 201, "pid": 1336757, "tid": 1336757, "ts": 1295650239304.765, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650239332.064, "dur": 10.795, "args": { "External id": 13571,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650239336.549, "dur": 5.924, "args": { "External id": 13572,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7067 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650239421.379, "dur": 78.418, "args": { "External id": 13573,"Record function id": 0, "Ev Idx": 7068 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650239501.488, "dur": 1172.757, "args": { "External id": 13574,"Record function id": 0, "Ev Idx": 7069 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650239540.978, "dur": 1118.000, "args": { "External id": 13575,"Sequence number": 246568, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7070 } }, { "ph": "s", "id": 200, "pid": 1336757, "tid": 1336757, "ts": 1295650239540.978, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650239613.992, "dur": 49.148, "args": { "External id": 13576,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650239676.886, "dur": 105.614, "args": { "External id": 13577,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650239792.426, "dur": 39.848, "args": { "External id": 13578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650239840.886, "dur": 30.816, "args": { "External id": 13579,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7074 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650239896.895, "dur": 29.606, "args": { "External id": 13580,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7075 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650239944.254, "dur": 16.183, "args": { "External id": 13581,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7076 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650239978.337, "dur": 180.054, "args": { "External id": 13582,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650240072.670, "dur": 13.155, "args": { "External id": 13583,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650240078.203, "dur": 6.507, "args": { "External id": 13584,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650240088.985, "dur": 6.842, "args": { "External id": 13585,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650240097.255, "dur": 1.174, "args": { "External id": 13586,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650240101.152, "dur": 4.265, "args": { "External id": 13587,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650240169.352, "dur": 52.980, "args": { "External id": 13588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7083 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650240282.827, "dur": 40.815, "args": { "External id": 13589,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650240336.715, "dur": 56.430, "args": { "External id": 13590,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650240403.476, "dur": 37.516, "args": { "External id": 13591,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7086 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650240466.648, "dur": 28.945, "args": { "External id": 13592,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650240501.957, "dur": 37.923, "args": { "External id": 13593,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7088 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650240562.085, "dur": 21.156, "args": { "External id": 13594,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7089 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.13)", "pid": 1336757, "tid": 1336757, "ts": 1295650240742.229, "dur": 83.152, "args": { "External id": 13595,"Record function id": 0, "Ev Idx": 7090 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650240900.715, "dur": 45.082, "args": { "External id": 13596,"Record function id": 0, "Ev Idx": 7091 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.14)", "pid": 1336757, "tid": 1336757, "ts": 1295650240954.593, "dur": 18109.701, "args": { "External id": 13597,"Record function id": 0, "Ev Idx": 7092 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 1336757, "tid": 1336757, "ts": 1295650240963.453, "dur": 1015.261, "args": { "External id": 13598,"Record function id": 0, "Ev Idx": 7093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650241088.532, "dur": 10.100, "args": { "External id": 13599,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650241113.052, "dur": 45.060, "args": { "External id": 13600,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241124.696, "dur": 2.641, "args": { "External id": 13601,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241131.973, "dur": 0.798, "args": { "External id": 13602,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241133.840, "dur": 0.191, "args": { "External id": 13603,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241135.164, "dur": 2.660, "args": { "External id": 13604,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241138.846, "dur": 0.200, "args": { "External id": 13605,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241142.722, "dur": 0.343, "args": { "External id": 13606,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241145.822, "dur": 1.371, "args": { "External id": 13607,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241148.331, "dur": 0.344, "args": { "External id": 13608,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241149.462, "dur": 2.676, "args": { "External id": 13609,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650241170.177, "dur": 42.238, "args": { "External id": 13610,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7105 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650241271.389, "dur": 150.371, "args": { "External id": 13611,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650241286.449, "dur": 8.079, "args": { "External id": 13612,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650241301.356, "dur": 13.821, "args": { "External id": 13613,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650241306.575, "dur": 8.074, "args": { "External id": 13614,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241311.250, "dur": 1.323, "args": { "External id": 13615,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650241324.820, "dur": 36.734, "args": { "External id": 13616,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241327.692, "dur": 0.522, "args": { "External id": 13617,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241330.916, "dur": 0.604, "args": { "External id": 13618,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241333.525, "dur": 2.634, "args": { "External id": 13619,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241338.413, "dur": 1.411, "args": { "External id": 13620,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241341.412, "dur": 0.411, "args": { "External id": 13621,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241346.783, "dur": 0.373, "args": { "External id": 13622,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241348.703, "dur": 0.461, "args": { "External id": 13623,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241351.519, "dur": 0.456, "args": { "External id": 13624,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650241355.780, "dur": 0.446, "args": { "External id": 13625,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650241377.414, "dur": 34.200, "args": { "External id": 13626,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7121 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650241492.497, "dur": 390.853, "args": { "External id": 13627,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7122 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650241528.336, "dur": 349.886, "args": { "External id": 13628,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7123, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650241539.256, "dur": 333.897, "args": { "External id": 13629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7124 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650241907.882, "dur": 2.848, "args": { "External id": 13630,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7125, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 1336757, "tid": 1336757, "ts": 1295650242040.785, "dur": 16769.558, "args": { "External id": 13631,"Record function id": 0, "Ev Idx": 7126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242145.503, "dur": 6.850, "args": { "External id": 13632,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242155.631, "dur": 1.177, "args": { "External id": 13633,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242158.364, "dur": 2.900, "args": { "External id": 13634,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242162.886, "dur": 0.962, "args": { "External id": 13635,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242165.180, "dur": 0.718, "args": { "External id": 13636,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242166.945, "dur": 0.673, "args": { "External id": 13637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242171.393, "dur": 0.888, "args": { "External id": 13638,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242174.567, "dur": 1.817, "args": { "External id": 13639,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242177.808, "dur": 0.833, "args": { "External id": 13640,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650242180.643, "dur": 0.885, "args": { "External id": 13641,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7136 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650242201.834, "dur": 16556.244, "args": { "External id": 13642,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650242217.522, "dur": 16531.285, "args": { "External id": 13643,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650242259.353, "dur": 18.043, "args": { "External id": 13644,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650242281.483, "dur": 16429.619, "args": { "External id": 13645,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650242284.896, "dur": 16425.210, "args": { "External id": 13646,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650242292.284, "dur": 8.205, "args": { "External id": 13647,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650242302.720, "dur": 16403.594, "args": { "External id": 13648,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7143 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650258954.562, "dur": 80.924, "args": { "External id": 13649,"Sequence number": 246569, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7144 } }, { "ph": "s", "id": 199, "pid": 1336757, "tid": 1336757, "ts": 1295650258954.562, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650258978.781, "dur": 50.756, "args": { "External id": 13650,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650259022.858, "dur": 6.295, "args": { "External id": 13651,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7146 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650259105.727, "dur": 78.016, "args": { "External id": 13652,"Record function id": 0, "Ev Idx": 7147 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650259185.345, "dur": 1194.646, "args": { "External id": 13653,"Record function id": 0, "Ev Idx": 7148 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650259227.042, "dur": 1137.070, "args": { "External id": 13654,"Sequence number": 246570, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7149 } }, { "ph": "s", "id": 198, "pid": 1336757, "tid": 1336757, "ts": 1295650259227.042, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650259329.712, "dur": 55.761, "args": { "External id": 13655,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650259400.311, "dur": 108.465, "args": { "External id": 13656,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650259518.877, "dur": 40.063, "args": { "External id": 13657,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650259568.177, "dur": 30.948, "args": { "External id": 13658,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7153 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650259625.019, "dur": 25.535, "args": { "External id": 13659,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7154 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650259669.179, "dur": 15.382, "args": { "External id": 13660,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7155 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650259705.156, "dur": 144.896, "args": { "External id": 13661,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650259765.029, "dur": 12.954, "args": { "External id": 13662,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650259770.724, "dur": 6.114, "args": { "External id": 13663,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650259781.158, "dur": 6.209, "args": { "External id": 13664,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650259788.600, "dur": 1.422, "args": { "External id": 13665,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650259792.320, "dur": 4.879, "args": { "External id": 13666,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650259860.759, "dur": 44.149, "args": { "External id": 13667,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7162 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650259938.899, "dur": 28.788, "args": { "External id": 13668,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650259976.825, "dur": 84.584, "args": { "External id": 13669,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650260074.086, "dur": 36.827, "args": { "External id": 13670,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7165 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650260133.818, "dur": 29.406, "args": { "External id": 13671,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650260169.116, "dur": 34.664, "args": { "External id": 13672,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7167 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650260242.839, "dur": 32.085, "args": { "External id": 13673,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7168 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.14)", "pid": 1336757, "tid": 1336757, "ts": 1295650260449.085, "dur": 81.795, "args": { "External id": 13674,"Record function id": 0, "Ev Idx": 7169 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650260604.543, "dur": 47.070, "args": { "External id": 13675,"Record function id": 0, "Ev Idx": 7170 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.15)", "pid": 1336757, "tid": 1336757, "ts": 1295650260661.229, "dur": 17999.352, "args": { "External id": 13676,"Record function id": 0, "Ev Idx": 7171 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 1336757, "tid": 1336757, "ts": 1295650260669.659, "dur": 964.676, "args": { "External id": 13677,"Record function id": 0, "Ev Idx": 7172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650260750.416, "dur": 10.245, "args": { "External id": 13678,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650260774.505, "dur": 38.552, "args": { "External id": 13679,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260780.052, "dur": 2.621, "args": { "External id": 13680,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260787.838, "dur": 0.754, "args": { "External id": 13681,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260790.152, "dur": 0.289, "args": { "External id": 13682,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260791.716, "dur": 0.456, "args": { "External id": 13683,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260795.732, "dur": 0.602, "args": { "External id": 13684,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260797.278, "dur": 0.426, "args": { "External id": 13685,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260799.241, "dur": 3.774, "args": { "External id": 13686,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260804.373, "dur": 0.413, "args": { "External id": 13687,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260806.513, "dur": 0.592, "args": { "External id": 13688,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650260824.169, "dur": 39.106, "args": { "External id": 13689,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7184 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650260895.674, "dur": 164.775, "args": { "External id": 13690,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650260906.232, "dur": 4.444, "args": { "External id": 13691,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650260915.446, "dur": 10.152, "args": { "External id": 13692,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650260920.086, "dur": 5.047, "args": { "External id": 13693,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260923.336, "dur": 0.569, "args": { "External id": 13694,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650260932.160, "dur": 30.082, "args": { "External id": 13695,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260934.509, "dur": 2.351, "args": { "External id": 13696,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260938.242, "dur": 0.250, "args": { "External id": 13697,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260940.110, "dur": 0.631, "args": { "External id": 13698,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260944.002, "dur": 1.911, "args": { "External id": 13699,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260947.134, "dur": 0.570, "args": { "External id": 13700,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260948.850, "dur": 0.169, "args": { "External id": 13701,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260952.798, "dur": 0.516, "args": { "External id": 13702,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260954.357, "dur": 0.325, "args": { "External id": 13703,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650260955.918, "dur": 2.493, "args": { "External id": 13704,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650260984.007, "dur": 66.070, "args": { "External id": 13705,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7200 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650261118.473, "dur": 404.206, "args": { "External id": 13706,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7201 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650261153.084, "dur": 363.692, "args": { "External id": 13707,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7202, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650261166.104, "dur": 343.066, "args": { "External id": 13708,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7203 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650261550.419, "dur": 2.657, "args": { "External id": 13709,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7204, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 1336757, "tid": 1336757, "ts": 1295650261655.315, "dur": 16791.236, "args": { "External id": 13710,"Record function id": 0, "Ev Idx": 7205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261761.328, "dur": 6.796, "args": { "External id": 13711,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261771.736, "dur": 0.834, "args": { "External id": 13712,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261774.589, "dur": 2.399, "args": { "External id": 13713,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261779.068, "dur": 1.202, "args": { "External id": 13714,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261781.916, "dur": 1.044, "args": { "External id": 13715,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261784.286, "dur": 1.121, "args": { "External id": 13716,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261789.772, "dur": 0.815, "args": { "External id": 13717,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261792.088, "dur": 1.723, "args": { "External id": 13718,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261795.182, "dur": 0.655, "args": { "External id": 13719,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650261798.062, "dur": 1.097, "args": { "External id": 13720,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7215 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650261820.621, "dur": 16574.923, "args": { "External id": 13721,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650261836.822, "dur": 16548.800, "args": { "External id": 13722,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650261858.078, "dur": 15.280, "args": { "External id": 13723,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650261876.587, "dur": 16470.635, "args": { "External id": 13724,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650261879.136, "dur": 16467.238, "args": { "External id": 13725,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650261885.178, "dur": 5.465, "args": { "External id": 13726,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650261892.654, "dur": 16449.593, "args": { "External id": 13727,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7222 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650278590.433, "dur": 45.160, "args": { "External id": 13728,"Sequence number": 246571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7223 } }, { "ph": "s", "id": 197, "pid": 1336757, "tid": 1336757, "ts": 1295650278590.433, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650278619.944, "dur": 10.560, "args": { "External id": 13729,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650278624.256, "dur": 5.949, "args": { "External id": 13730,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7225 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650278700.019, "dur": 79.001, "args": { "External id": 13731,"Record function id": 0, "Ev Idx": 7226 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650278780.874, "dur": 1140.608, "args": { "External id": 13732,"Record function id": 0, "Ev Idx": 7227 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650278821.215, "dur": 1086.174, "args": { "External id": 13733,"Sequence number": 246572, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7228 } }, { "ph": "s", "id": 196, "pid": 1336757, "tid": 1336757, "ts": 1295650278821.215, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650278888.328, "dur": 43.481, "args": { "External id": 13734,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650278944.581, "dur": 133.497, "args": { "External id": 13735,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650279092.927, "dur": 41.565, "args": { "External id": 13736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650279143.495, "dur": 30.888, "args": { "External id": 13737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7232 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650279201.605, "dur": 43.993, "args": { "External id": 13738,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7233 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650279275.544, "dur": 24.973, "args": { "External id": 13739,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7234 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650279324.045, "dur": 148.778, "args": { "External id": 13740,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650279386.789, "dur": 13.437, "args": { "External id": 13741,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650279392.214, "dur": 7.092, "args": { "External id": 13742,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650279403.096, "dur": 6.016, "args": { "External id": 13743,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650279410.816, "dur": 1.444, "args": { "External id": 13744,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650279414.425, "dur": 4.888, "args": { "External id": 13745,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650279485.053, "dur": 59.678, "args": { "External id": 13746,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7241 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650279577.303, "dur": 29.326, "args": { "External id": 13747,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650279616.110, "dur": 41.879, "args": { "External id": 13748,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650279666.511, "dur": 35.306, "args": { "External id": 13749,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7244 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650279725.759, "dur": 25.835, "args": { "External id": 13750,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650279757.113, "dur": 33.691, "args": { "External id": 13751,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7246 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650279812.028, "dur": 22.044, "args": { "External id": 13752,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7247 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.15)", "pid": 1336757, "tid": 1336757, "ts": 1295650280027.776, "dur": 80.730, "args": { "External id": 13753,"Record function id": 0, "Ev Idx": 7248 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650280186.793, "dur": 66.792, "args": { "External id": 13754,"Record function id": 0, "Ev Idx": 7249 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.16)", "pid": 1336757, "tid": 1336757, "ts": 1295650280267.285, "dur": 17990.310, "args": { "External id": 13755,"Record function id": 0, "Ev Idx": 7250 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 1336757, "tid": 1336757, "ts": 1295650280279.124, "dur": 926.096, "args": { "External id": 13756,"Record function id": 0, "Ev Idx": 7251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650280376.026, "dur": 11.572, "args": { "External id": 13757,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650280402.466, "dur": 37.830, "args": { "External id": 13758,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280408.604, "dur": 2.413, "args": { "External id": 13759,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280415.400, "dur": 0.516, "args": { "External id": 13760,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280417.483, "dur": 0.685, "args": { "External id": 13761,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280419.268, "dur": 0.531, "args": { "External id": 13762,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280423.516, "dur": 0.394, "args": { "External id": 13763,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280425.003, "dur": 0.826, "args": { "External id": 13764,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280427.162, "dur": 3.809, "args": { "External id": 13765,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280432.169, "dur": 0.194, "args": { "External id": 13766,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280433.943, "dur": 0.506, "args": { "External id": 13767,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650280455.801, "dur": 48.856, "args": { "External id": 13768,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7263 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650280539.186, "dur": 112.434, "args": { "External id": 13769,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650280550.117, "dur": 6.761, "args": { "External id": 13770,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650280562.135, "dur": 10.763, "args": { "External id": 13771,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650280567.201, "dur": 5.042, "args": { "External id": 13772,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280570.582, "dur": 0.479, "args": { "External id": 13773,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650280579.654, "dur": 29.251, "args": { "External id": 13774,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280581.907, "dur": 0.527, "args": { "External id": 13775,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280583.453, "dur": 2.599, "args": { "External id": 13776,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280587.685, "dur": 0.476, "args": { "External id": 13777,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280589.484, "dur": 1.811, "args": { "External id": 13778,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280595.662, "dur": 0.495, "args": { "External id": 13779,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280597.409, "dur": 0.360, "args": { "External id": 13780,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280599.101, "dur": 0.169, "args": { "External id": 13781,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280602.550, "dur": 0.531, "args": { "External id": 13782,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650280604.489, "dur": 0.352, "args": { "External id": 13783,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650280620.445, "dur": 22.603, "args": { "External id": 13784,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7279 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650280704.864, "dur": 398.760, "args": { "External id": 13785,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7280 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650280739.160, "dur": 358.490, "args": { "External id": 13786,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7281, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650280749.723, "dur": 341.735, "args": { "External id": 13787,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7282 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650281131.411, "dur": 2.581, "args": { "External id": 13788,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7283, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 1336757, "tid": 1336757, "ts": 1295650281227.037, "dur": 16798.635, "args": { "External id": 13789,"Record function id": 0, "Ev Idx": 7284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281375.495, "dur": 7.653, "args": { "External id": 13790,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281388.052, "dur": 1.641, "args": { "External id": 13791,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281392.402, "dur": 3.575, "args": { "External id": 13792,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281398.248, "dur": 0.875, "args": { "External id": 13793,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281400.712, "dur": 1.295, "args": { "External id": 13794,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281402.928, "dur": 1.244, "args": { "External id": 13795,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281408.154, "dur": 0.801, "args": { "External id": 13796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281410.466, "dur": 1.797, "args": { "External id": 13797,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281414.181, "dur": 0.702, "args": { "External id": 13798,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650281416.139, "dur": 0.735, "args": { "External id": 13799,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7294 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650281438.962, "dur": 16511.322, "args": { "External id": 13800,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650281455.639, "dur": 16486.372, "args": { "External id": 13801,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650281480.858, "dur": 15.737, "args": { "External id": 13802,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650281499.814, "dur": 16403.871, "args": { "External id": 13803,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650281502.728, "dur": 16400.343, "args": { "External id": 13804,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650281509.059, "dur": 5.508, "args": { "External id": 13805,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650281516.310, "dur": 16383.147, "args": { "External id": 13806,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7301 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650298173.690, "dur": 39.406, "args": { "External id": 13807,"Sequence number": 246573, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7302 } }, { "ph": "s", "id": 195, "pid": 1336757, "tid": 1336757, "ts": 1295650298173.690, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650298198.021, "dur": 9.962, "args": { "External id": 13808,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650298202.168, "dur": 5.493, "args": { "External id": 13809,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7304 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650298307.074, "dur": 88.864, "args": { "External id": 13810,"Record function id": 0, "Ev Idx": 7305 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650298398.000, "dur": 1209.586, "args": { "External id": 13811,"Record function id": 0, "Ev Idx": 7306 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650298441.779, "dur": 1150.969, "args": { "External id": 13812,"Sequence number": 246574, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7307 } }, { "ph": "s", "id": 194, "pid": 1336757, "tid": 1336757, "ts": 1295650298441.779, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650298511.679, "dur": 47.543, "args": { "External id": 13813,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650298572.837, "dur": 105.836, "args": { "External id": 13814,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650298689.524, "dur": 37.986, "args": { "External id": 13815,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650298736.839, "dur": 31.262, "args": { "External id": 13816,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7311 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650298798.697, "dur": 28.375, "args": { "External id": 13817,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7312 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650298842.383, "dur": 16.061, "args": { "External id": 13818,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7313 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650298877.142, "dur": 180.371, "args": { "External id": 13819,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650298931.684, "dur": 12.194, "args": { "External id": 13820,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650298936.909, "dur": 6.141, "args": { "External id": 13821,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650298946.611, "dur": 5.938, "args": { "External id": 13822,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650298953.818, "dur": 1.096, "args": { "External id": 13823,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650298957.667, "dur": 6.515, "args": { "External id": 13824,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650299100.070, "dur": 57.318, "args": { "External id": 13825,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7320 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650299196.383, "dur": 30.665, "args": { "External id": 13826,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650299258.734, "dur": 62.371, "args": { "External id": 13827,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650299333.215, "dur": 43.609, "args": { "External id": 13828,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7323 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650299403.612, "dur": 32.247, "args": { "External id": 13829,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650299441.666, "dur": 34.705, "args": { "External id": 13830,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7325 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650299499.744, "dur": 19.306, "args": { "External id": 13831,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7326 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.16)", "pid": 1336757, "tid": 1336757, "ts": 1295650299676.651, "dur": 77.952, "args": { "External id": 13832,"Record function id": 0, "Ev Idx": 7327 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650299831.032, "dur": 44.818, "args": { "External id": 13833,"Record function id": 0, "Ev Idx": 7328 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.17)", "pid": 1336757, "tid": 1336757, "ts": 1295650299884.648, "dur": 18022.206, "args": { "External id": 13834,"Record function id": 0, "Ev Idx": 7329 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 1336757, "tid": 1336757, "ts": 1295650299894.823, "dur": 937.559, "args": { "External id": 13835,"Record function id": 0, "Ev Idx": 7330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650299980.298, "dur": 49.633, "args": { "External id": 13836,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650300046.970, "dur": 35.916, "args": { "External id": 13837,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300052.390, "dur": 2.502, "args": { "External id": 13838,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300059.204, "dur": 0.253, "args": { "External id": 13839,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300061.008, "dur": 0.442, "args": { "External id": 13840,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300063.173, "dur": 0.446, "args": { "External id": 13841,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300067.058, "dur": 0.561, "args": { "External id": 13842,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300069.168, "dur": 0.179, "args": { "External id": 13843,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300070.699, "dur": 2.983, "args": { "External id": 13844,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300074.989, "dur": 0.194, "args": { "External id": 13845,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300076.874, "dur": 0.170, "args": { "External id": 13846,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650300095.690, "dur": 43.003, "args": { "External id": 13847,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7342 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650300175.026, "dur": 154.684, "args": { "External id": 13848,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650300186.982, "dur": 4.511, "args": { "External id": 13849,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650300196.462, "dur": 10.978, "args": { "External id": 13850,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650300201.449, "dur": 5.582, "args": { "External id": 13851,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300205.389, "dur": 0.351, "args": { "External id": 13852,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650300214.165, "dur": 52.917, "args": { "External id": 13853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300216.222, "dur": 2.601, "args": { "External id": 13854,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300220.164, "dur": 0.336, "args": { "External id": 13855,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300222.274, "dur": 0.515, "args": { "External id": 13856,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300226.896, "dur": 16.957, "args": { "External id": 13857,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300247.468, "dur": 0.405, "args": { "External id": 13858,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300249.919, "dur": 0.291, "args": { "External id": 13859,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300254.424, "dur": 0.290, "args": { "External id": 13860,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300256.749, "dur": 0.268, "args": { "External id": 13861,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650300258.928, "dur": 2.639, "args": { "External id": 13862,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650300286.554, "dur": 32.599, "args": { "External id": 13863,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7358 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650300393.747, "dur": 347.695, "args": { "External id": 13864,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7359 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650300428.405, "dur": 308.663, "args": { "External id": 13865,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7360, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650300438.972, "dur": 292.920, "args": { "External id": 13866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7361 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650300762.703, "dur": 2.407, "args": { "External id": 13867,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7362, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 1336757, "tid": 1336757, "ts": 1295650300854.166, "dur": 16844.714, "args": { "External id": 13868,"Record function id": 0, "Ev Idx": 7363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300954.176, "dur": 5.689, "args": { "External id": 13869,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300963.538, "dur": 1.119, "args": { "External id": 13870,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300966.471, "dur": 2.399, "args": { "External id": 13871,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300970.399, "dur": 0.864, "args": { "External id": 13872,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300972.588, "dur": 0.867, "args": { "External id": 13873,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300975.317, "dur": 0.662, "args": { "External id": 13874,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300980.246, "dur": 0.880, "args": { "External id": 13875,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650300982.693, "dur": 38.819, "args": { "External id": 13876,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650301026.204, "dur": 1.314, "args": { "External id": 13877,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650301028.991, "dur": 0.780, "args": { "External id": 13878,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7373 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650301051.700, "dur": 16598.526, "args": { "External id": 13879,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650301067.740, "dur": 16574.021, "args": { "External id": 13880,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650301091.295, "dur": 15.020, "args": { "External id": 13881,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650301109.280, "dur": 16495.955, "args": { "External id": 13882,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650301111.932, "dur": 16492.565, "args": { "External id": 13883,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650301117.759, "dur": 5.834, "args": { "External id": 13884,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650301125.418, "dur": 16475.374, "args": { "External id": 13885,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7380 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650317842.838, "dur": 38.289, "args": { "External id": 13886,"Sequence number": 246575, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7381 } }, { "ph": "s", "id": 193, "pid": 1336757, "tid": 1336757, "ts": 1295650317842.838, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650317867.021, "dur": 9.189, "args": { "External id": 13887,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650317870.688, "dur": 5.287, "args": { "External id": 13888,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7383 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650317947.160, "dur": 113.609, "args": { "External id": 13889,"Record function id": 0, "Ev Idx": 7384 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650318064.004, "dur": 1147.782, "args": { "External id": 13890,"Record function id": 0, "Ev Idx": 7385 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650318107.514, "dur": 1089.612, "args": { "External id": 13891,"Sequence number": 246576, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7386 } }, { "ph": "s", "id": 192, "pid": 1336757, "tid": 1336757, "ts": 1295650318107.514, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650318181.045, "dur": 60.507, "args": { "External id": 13892,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650318262.404, "dur": 110.989, "args": { "External id": 13893,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650318384.570, "dur": 40.838, "args": { "External id": 13894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650318434.542, "dur": 30.852, "args": { "External id": 13895,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7390 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650318497.303, "dur": 28.139, "args": { "External id": 13896,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7391 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650318544.881, "dur": 15.819, "args": { "External id": 13897,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7392 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650318581.205, "dur": 139.126, "args": { "External id": 13898,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650318635.542, "dur": 12.562, "args": { "External id": 13899,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650318640.755, "dur": 6.429, "args": { "External id": 13900,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650318650.946, "dur": 5.493, "args": { "External id": 13901,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650318657.888, "dur": 1.288, "args": { "External id": 13902,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650318662.317, "dur": 4.712, "args": { "External id": 13903,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650318731.654, "dur": 48.986, "args": { "External id": 13904,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7399 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650318812.900, "dur": 29.425, "args": { "External id": 13905,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650318851.317, "dur": 41.153, "args": { "External id": 13906,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650318901.500, "dur": 35.757, "args": { "External id": 13907,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7402 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650318961.216, "dur": 65.968, "args": { "External id": 13908,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650319035.768, "dur": 42.257, "args": { "External id": 13909,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7404 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650319101.017, "dur": 23.030, "args": { "External id": 13910,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7405 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.17)", "pid": 1336757, "tid": 1336757, "ts": 1295650319305.597, "dur": 90.031, "args": { "External id": 13911,"Record function id": 0, "Ev Idx": 7406 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650319477.013, "dur": 48.167, "args": { "External id": 13912,"Record function id": 0, "Ev Idx": 7407 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.18)", "pid": 1336757, "tid": 1336757, "ts": 1295650319534.970, "dur": 17947.351, "args": { "External id": 13913,"Record function id": 0, "Ev Idx": 7408 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 1336757, "tid": 1336757, "ts": 1295650319542.567, "dur": 946.417, "args": { "External id": 13914,"Record function id": 0, "Ev Idx": 7409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650319627.037, "dur": 10.401, "args": { "External id": 13915,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650319650.732, "dur": 36.697, "args": { "External id": 13916,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319656.430, "dur": 2.414, "args": { "External id": 13917,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319663.817, "dur": 0.221, "args": { "External id": 13918,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319665.159, "dur": 0.466, "args": { "External id": 13919,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319667.552, "dur": 0.491, "args": { "External id": 13920,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319671.297, "dur": 0.315, "args": { "External id": 13921,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319673.242, "dur": 0.189, "args": { "External id": 13922,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319674.727, "dur": 3.916, "args": { "External id": 13923,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319680.039, "dur": 0.675, "args": { "External id": 13924,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319681.512, "dur": 0.142, "args": { "External id": 13925,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650319699.402, "dur": 43.760, "args": { "External id": 13926,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7421 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650319776.421, "dur": 114.018, "args": { "External id": 13927,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650319790.822, "dur": 6.473, "args": { "External id": 13928,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650319802.291, "dur": 10.399, "args": { "External id": 13929,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650319806.796, "dur": 5.507, "args": { "External id": 13930,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319810.617, "dur": 0.485, "args": { "External id": 13931,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650319819.363, "dur": 30.200, "args": { "External id": 13932,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319821.546, "dur": 0.595, "args": { "External id": 13933,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319823.949, "dur": 2.622, "args": { "External id": 13934,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319828.100, "dur": 0.362, "args": { "External id": 13935,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319830.576, "dur": 1.499, "args": { "External id": 13936,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319835.628, "dur": 0.345, "args": { "External id": 13937,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319837.751, "dur": 0.655, "args": { "External id": 13938,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319839.662, "dur": 0.520, "args": { "External id": 13939,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319843.349, "dur": 0.298, "args": { "External id": 13940,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650319844.928, "dur": 0.190, "args": { "External id": 13941,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650319860.440, "dur": 22.367, "args": { "External id": 13942,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7437 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650319942.221, "dur": 433.781, "args": { "External id": 13943,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7438 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650319975.159, "dur": 394.372, "args": { "External id": 13944,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7439, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650320026.510, "dur": 336.368, "args": { "External id": 13945,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7440 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650320406.751, "dur": 2.531, "args": { "External id": 13946,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7441, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 1336757, "tid": 1336757, "ts": 1295650320509.935, "dur": 16737.685, "args": { "External id": 13947,"Record function id": 0, "Ev Idx": 7442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320612.704, "dur": 7.023, "args": { "External id": 13948,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320623.207, "dur": 1.130, "args": { "External id": 13949,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320626.158, "dur": 2.089, "args": { "External id": 13950,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320629.951, "dur": 0.859, "args": { "External id": 13951,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320632.270, "dur": 1.167, "args": { "External id": 13952,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320634.703, "dur": 0.685, "args": { "External id": 13953,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320639.574, "dur": 0.595, "args": { "External id": 13954,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320642.216, "dur": 1.894, "args": { "External id": 13955,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320645.594, "dur": 0.875, "args": { "External id": 13956,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650320648.038, "dur": 0.568, "args": { "External id": 13957,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7452 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650320669.000, "dur": 16513.652, "args": { "External id": 13958,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650320684.686, "dur": 16488.922, "args": { "External id": 13959,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650320706.159, "dur": 14.037, "args": { "External id": 13960,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650320723.306, "dur": 16412.958, "args": { "External id": 13961,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650320725.851, "dur": 16409.566, "args": { "External id": 13962,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650320732.632, "dur": 5.326, "args": { "External id": 13963,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650320739.744, "dur": 16391.975, "args": { "External id": 13964,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7459 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650337414.342, "dur": 42.907, "args": { "External id": 13965,"Sequence number": 246577, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7460 } }, { "ph": "s", "id": 191, "pid": 1336757, "tid": 1336757, "ts": 1295650337414.342, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650337441.267, "dur": 10.992, "args": { "External id": 13966,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650337445.853, "dur": 6.070, "args": { "External id": 13967,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7462 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650337521.940, "dur": 77.521, "args": { "External id": 13968,"Record function id": 0, "Ev Idx": 7463 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650337601.123, "dur": 1151.157, "args": { "External id": 13969,"Record function id": 0, "Ev Idx": 7464 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650337642.026, "dur": 1095.886, "args": { "External id": 13970,"Sequence number": 246578, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7465 } }, { "ph": "s", "id": 190, "pid": 1336757, "tid": 1336757, "ts": 1295650337642.026, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650337715.043, "dur": 43.938, "args": { "External id": 13971,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650337774.054, "dur": 105.764, "args": { "External id": 13972,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650337889.748, "dur": 39.550, "args": { "External id": 13973,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650337935.619, "dur": 31.563, "args": { "External id": 13974,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7469 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650338034.393, "dur": 30.023, "args": { "External id": 13975,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7470 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650338082.569, "dur": 18.860, "args": { "External id": 13976,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7471 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650338117.898, "dur": 159.606, "args": { "External id": 13977,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650338169.506, "dur": 12.978, "args": { "External id": 13978,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650338174.868, "dur": 6.716, "args": { "External id": 13979,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650338185.580, "dur": 5.769, "args": { "External id": 13980,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650338192.858, "dur": 3.460, "args": { "External id": 13981,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650338198.768, "dur": 3.313, "args": { "External id": 13982,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650338293.328, "dur": 72.737, "args": { "External id": 13983,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7478 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650338404.472, "dur": 31.482, "args": { "External id": 13984,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650338445.134, "dur": 43.433, "args": { "External id": 13985,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650338496.540, "dur": 34.393, "args": { "External id": 13986,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7481 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650338558.164, "dur": 26.749, "args": { "External id": 13987,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650338591.631, "dur": 36.324, "args": { "External id": 13988,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7483 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650338646.459, "dur": 21.534, "args": { "External id": 13989,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7484 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.18)", "pid": 1336757, "tid": 1336757, "ts": 1295650338819.587, "dur": 79.272, "args": { "External id": 13990,"Record function id": 0, "Ev Idx": 7485 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650338974.706, "dur": 89.877, "args": { "External id": 13991,"Record function id": 0, "Ev Idx": 7486 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.19)", "pid": 1336757, "tid": 1336757, "ts": 1295650339075.488, "dur": 17847.174, "args": { "External id": 13992,"Record function id": 0, "Ev Idx": 7487 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 1336757, "tid": 1336757, "ts": 1295650339085.748, "dur": 991.578, "args": { "External id": 13993,"Record function id": 0, "Ev Idx": 7488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650339170.966, "dur": 10.940, "args": { "External id": 13994,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650339195.474, "dur": 59.716, "args": { "External id": 13995,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339201.523, "dur": 3.043, "args": { "External id": 13996,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339209.676, "dur": 0.640, "args": { "External id": 13997,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339211.925, "dur": 0.943, "args": { "External id": 13998,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339213.903, "dur": 1.160, "args": { "External id": 13999,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339218.792, "dur": 0.738, "args": { "External id": 14000,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339220.750, "dur": 0.823, "args": { "External id": 14001,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339223.148, "dur": 2.670, "args": { "External id": 14002,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339242.012, "dur": 1.515, "args": { "External id": 14003,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339247.108, "dur": 1.101, "args": { "External id": 14004,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650339270.346, "dur": 53.576, "args": { "External id": 14005,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7500 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650339369.629, "dur": 122.218, "args": { "External id": 14006,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650339382.776, "dur": 6.935, "args": { "External id": 14007,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650339394.920, "dur": 10.816, "args": { "External id": 14008,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650339399.638, "dur": 5.707, "args": { "External id": 14009,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339403.114, "dur": 0.799, "args": { "External id": 14010,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650339413.419, "dur": 32.071, "args": { "External id": 14011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339415.692, "dur": 3.161, "args": { "External id": 14012,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339420.368, "dur": 0.712, "args": { "External id": 14013,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339423.188, "dur": 0.853, "args": { "External id": 14014,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339427.621, "dur": 0.521, "args": { "External id": 14015,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339429.888, "dur": 0.525, "args": { "External id": 14016,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339431.521, "dur": 0.583, "args": { "External id": 14017,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339435.537, "dur": 0.530, "args": { "External id": 14018,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339437.404, "dur": 0.466, "args": { "External id": 14019,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650339439.589, "dur": 2.144, "args": { "External id": 14020,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650339459.413, "dur": 23.980, "args": { "External id": 14021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7516 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650339549.010, "dur": 390.516, "args": { "External id": 14022,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7517 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650339583.394, "dur": 351.139, "args": { "External id": 14023,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7518, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650339594.407, "dur": 334.356, "args": { "External id": 14024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7519 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650339961.963, "dur": 2.613, "args": { "External id": 14025,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7520, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 1336757, "tid": 1336757, "ts": 1295650340100.024, "dur": 16613.295, "args": { "External id": 14026,"Record function id": 0, "Ev Idx": 7521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340204.570, "dur": 7.130, "args": { "External id": 14027,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340227.043, "dur": 19.322, "args": { "External id": 14028,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340251.941, "dur": 1.296, "args": { "External id": 14029,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340257.894, "dur": 1.362, "args": { "External id": 14030,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340261.354, "dur": 1.745, "args": { "External id": 14031,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340265.311, "dur": 1.893, "args": { "External id": 14032,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340269.889, "dur": 1.671, "args": { "External id": 14033,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340276.572, "dur": 2.708, "args": { "External id": 14034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340281.405, "dur": 1.455, "args": { "External id": 14035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650340285.686, "dur": 1.212, "args": { "External id": 14036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7531 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650340314.067, "dur": 16352.233, "args": { "External id": 14037,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650340334.190, "dur": 16323.790, "args": { "External id": 14038,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650340356.922, "dur": 14.286, "args": { "External id": 14039,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650340376.492, "dur": 16245.871, "args": { "External id": 14040,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650340379.213, "dur": 16242.502, "args": { "External id": 14041,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650340385.067, "dur": 6.121, "args": { "External id": 14042,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650340393.000, "dur": 16225.124, "args": { "External id": 14043,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7538 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650356855.693, "dur": 41.648, "args": { "External id": 14044,"Sequence number": 246579, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7539 } }, { "ph": "s", "id": 189, "pid": 1336757, "tid": 1336757, "ts": 1295650356855.693, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650356882.111, "dur": 10.353, "args": { "External id": 14045,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650356886.288, "dur": 5.892, "args": { "External id": 14046,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7541 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650356962.043, "dur": 111.321, "args": { "External id": 14047,"Record function id": 0, "Ev Idx": 7542 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650357076.672, "dur": 1149.820, "args": { "External id": 14048,"Record function id": 0, "Ev Idx": 7543 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650357117.335, "dur": 1095.376, "args": { "External id": 14049,"Sequence number": 246580, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7544 } }, { "ph": "s", "id": 188, "pid": 1336757, "tid": 1336757, "ts": 1295650357117.335, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650357190.377, "dur": 64.851, "args": { "External id": 14050,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650357276.548, "dur": 116.438, "args": { "External id": 14051,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650357404.376, "dur": 40.023, "args": { "External id": 14052,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650357454.162, "dur": 30.759, "args": { "External id": 14053,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7548 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650357512.860, "dur": 29.864, "args": { "External id": 14054,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7549 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650357564.298, "dur": 15.163, "args": { "External id": 14055,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7550 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650357599.567, "dur": 137.058, "args": { "External id": 14056,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650357654.203, "dur": 12.165, "args": { "External id": 14057,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650357659.831, "dur": 5.690, "args": { "External id": 14058,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650357669.388, "dur": 6.295, "args": { "External id": 14059,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650357677.653, "dur": 1.791, "args": { "External id": 14060,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650357682.015, "dur": 2.751, "args": { "External id": 14061,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650357748.576, "dur": 45.975, "args": { "External id": 14062,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7557 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650357824.680, "dur": 29.685, "args": { "External id": 14063,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650357863.219, "dur": 40.765, "args": { "External id": 14064,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650357912.841, "dur": 35.211, "args": { "External id": 14065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7560 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650357972.331, "dur": 67.347, "args": { "External id": 14066,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650358048.403, "dur": 40.031, "args": { "External id": 14067,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7562 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650358113.895, "dur": 22.929, "args": { "External id": 14068,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7563 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.19)", "pid": 1336757, "tid": 1336757, "ts": 1295650358323.281, "dur": 85.196, "args": { "External id": 14069,"Record function id": 0, "Ev Idx": 7564 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650358487.185, "dur": 47.585, "args": { "External id": 14070,"Record function id": 0, "Ev Idx": 7565 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.20)", "pid": 1336757, "tid": 1336757, "ts": 1295650358544.017, "dur": 17958.155, "args": { "External id": 14071,"Record function id": 0, "Ev Idx": 7566 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.20)", "pid": 1336757, "tid": 1336757, "ts": 1295650358551.442, "dur": 960.912, "args": { "External id": 14072,"Record function id": 0, "Ev Idx": 7567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650358640.055, "dur": 10.668, "args": { "External id": 14073,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650358664.422, "dur": 39.415, "args": { "External id": 14074,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358670.315, "dur": 2.618, "args": { "External id": 14075,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358677.569, "dur": 0.698, "args": { "External id": 14076,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358680.023, "dur": 0.497, "args": { "External id": 14077,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358682.369, "dur": 0.501, "args": { "External id": 14078,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358686.793, "dur": 0.432, "args": { "External id": 14079,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358688.762, "dur": 0.979, "args": { "External id": 14080,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358691.105, "dur": 2.452, "args": { "External id": 14081,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358694.831, "dur": 0.602, "args": { "External id": 14082,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358697.165, "dur": 0.906, "args": { "External id": 14083,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650358715.164, "dur": 43.543, "args": { "External id": 14084,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7579 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650358792.214, "dur": 113.703, "args": { "External id": 14085,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650358803.214, "dur": 5.040, "args": { "External id": 14086,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650358813.410, "dur": 10.495, "args": { "External id": 14087,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650358818.453, "dur": 5.078, "args": { "External id": 14088,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358821.658, "dur": 0.760, "args": { "External id": 14089,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650358830.812, "dur": 34.623, "args": { "External id": 14090,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358832.961, "dur": 3.171, "args": { "External id": 14091,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358837.527, "dur": 0.571, "args": { "External id": 14092,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358842.841, "dur": 0.625, "args": { "External id": 14093,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358846.587, "dur": 0.657, "args": { "External id": 14094,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358848.430, "dur": 0.862, "args": { "External id": 14095,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358850.682, "dur": 2.795, "args": { "External id": 14096,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358854.670, "dur": 0.837, "args": { "External id": 14097,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358856.945, "dur": 0.529, "args": { "External id": 14098,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650358861.031, "dur": 0.420, "args": { "External id": 14099,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650358875.056, "dur": 22.797, "args": { "External id": 14100,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7595 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650358958.423, "dur": 443.069, "args": { "External id": 14101,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7596 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650359030.086, "dur": 365.689, "args": { "External id": 14102,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7597, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650359042.793, "dur": 345.825, "args": { "External id": 14103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7598 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650359430.575, "dur": 2.896, "args": { "External id": 14104,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7599, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.20)", "pid": 1336757, "tid": 1336757, "ts": 1295650359534.390, "dur": 16735.253, "args": { "External id": 14105,"Record function id": 0, "Ev Idx": 7600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359641.668, "dur": 6.875, "args": { "External id": 14106,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359651.907, "dur": 1.870, "args": { "External id": 14107,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359655.465, "dur": 1.307, "args": { "External id": 14108,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359658.386, "dur": 1.235, "args": { "External id": 14109,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359661.227, "dur": 0.924, "args": { "External id": 14110,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359663.402, "dur": 1.277, "args": { "External id": 14111,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359669.080, "dur": 1.348, "args": { "External id": 14112,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359671.954, "dur": 1.761, "args": { "External id": 14113,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359675.712, "dur": 1.109, "args": { "External id": 14114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650359678.134, "dur": 0.756, "args": { "External id": 14115,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7610 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650359699.239, "dur": 16502.293, "args": { "External id": 14116,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650359716.161, "dur": 16476.392, "args": { "External id": 14117,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650359737.460, "dur": 14.480, "args": { "External id": 14118,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650359754.781, "dur": 16400.147, "args": { "External id": 14119,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650359757.231, "dur": 16396.661, "args": { "External id": 14120,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650359763.193, "dur": 5.833, "args": { "External id": 14121,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650359771.057, "dur": 16379.471, "args": { "External id": 14122,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7617 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650376429.514, "dur": 46.495, "args": { "External id": 14123,"Sequence number": 246581, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7618 } }, { "ph": "s", "id": 187, "pid": 1336757, "tid": 1336757, "ts": 1295650376429.514, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650376460.768, "dur": 10.339, "args": { "External id": 14124,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650376464.866, "dur": 6.033, "args": { "External id": 14125,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7620 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650376542.864, "dur": 77.375, "args": { "External id": 14126,"Record function id": 0, "Ev Idx": 7621 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650376621.894, "dur": 1157.794, "args": { "External id": 14127,"Record function id": 0, "Ev Idx": 7622 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650376662.888, "dur": 1102.459, "args": { "External id": 14128,"Sequence number": 246582, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7623 } }, { "ph": "s", "id": 186, "pid": 1336757, "tid": 1336757, "ts": 1295650376662.888, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650376730.415, "dur": 45.469, "args": { "External id": 14129,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650376788.596, "dur": 105.538, "args": { "External id": 14130,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650376905.928, "dur": 37.786, "args": { "External id": 14131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650376951.192, "dur": 69.486, "args": { "External id": 14132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7627 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650377056.762, "dur": 30.092, "args": { "External id": 14133,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7628 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650377103.964, "dur": 17.512, "args": { "External id": 14134,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7629 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650377139.336, "dur": 170.860, "args": { "External id": 14135,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650377192.633, "dur": 12.200, "args": { "External id": 14136,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650377197.352, "dur": 6.761, "args": { "External id": 14137,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650377207.898, "dur": 5.988, "args": { "External id": 14138,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650377215.263, "dur": 1.702, "args": { "External id": 14139,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650377222.501, "dur": 3.535, "args": { "External id": 14140,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650377329.365, "dur": 64.210, "args": { "External id": 14141,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7636 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650377430.879, "dur": 30.341, "args": { "External id": 14142,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650377470.981, "dur": 42.904, "args": { "External id": 14143,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650377521.096, "dur": 35.125, "args": { "External id": 14144,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7639 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650377580.169, "dur": 30.383, "args": { "External id": 14145,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650377617.456, "dur": 37.638, "args": { "External id": 14146,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7641 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650377674.686, "dur": 19.126, "args": { "External id": 14147,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7642 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.20)", "pid": 1336757, "tid": 1336757, "ts": 1295650377847.865, "dur": 77.439, "args": { "External id": 14148,"Record function id": 0, "Ev Idx": 7643 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650378042.812, "dur": 49.643, "args": { "External id": 14149,"Record function id": 0, "Ev Idx": 7644 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.21)", "pid": 1336757, "tid": 1336757, "ts": 1295650378101.589, "dur": 18028.574, "args": { "External id": 14150,"Record function id": 0, "Ev Idx": 7645 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.21)", "pid": 1336757, "tid": 1336757, "ts": 1295650378109.925, "dur": 949.990, "args": { "External id": 14151,"Record function id": 0, "Ev Idx": 7646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650378195.227, "dur": 11.298, "args": { "External id": 14152,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650378220.489, "dur": 66.194, "args": { "External id": 14153,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378226.169, "dur": 18.786, "args": { "External id": 14154,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378252.047, "dur": 1.116, "args": { "External id": 14155,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378255.235, "dur": 1.037, "args": { "External id": 14156,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378258.600, "dur": 0.806, "args": { "External id": 14157,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378263.545, "dur": 1.051, "args": { "External id": 14158,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378266.896, "dur": 1.199, "args": { "External id": 14159,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378270.206, "dur": 2.351, "args": { "External id": 14160,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378275.278, "dur": 1.142, "args": { "External id": 14161,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378278.705, "dur": 1.155, "args": { "External id": 14162,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650378301.640, "dur": 50.688, "args": { "External id": 14163,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7658 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650378390.274, "dur": 122.939, "args": { "External id": 14164,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650378403.366, "dur": 6.122, "args": { "External id": 14165,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650378414.812, "dur": 11.458, "args": { "External id": 14166,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650378419.659, "dur": 6.225, "args": { "External id": 14167,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378423.699, "dur": 0.861, "args": { "External id": 14168,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650378432.974, "dur": 31.657, "args": { "External id": 14169,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378435.693, "dur": 3.115, "args": { "External id": 14170,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378440.429, "dur": 0.648, "args": { "External id": 14171,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378442.286, "dur": 0.425, "args": { "External id": 14172,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378446.494, "dur": 0.431, "args": { "External id": 14173,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378448.087, "dur": 0.385, "args": { "External id": 14174,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378450.222, "dur": 0.720, "args": { "External id": 14175,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378454.226, "dur": 0.713, "args": { "External id": 14176,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378456.466, "dur": 0.580, "args": { "External id": 14177,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650378458.303, "dur": 2.522, "args": { "External id": 14178,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650378481.287, "dur": 23.231, "args": { "External id": 14179,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7674 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650378579.537, "dur": 351.810, "args": { "External id": 14180,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7675 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650378613.291, "dur": 313.194, "args": { "External id": 14181,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7676, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650378623.873, "dur": 290.231, "args": { "External id": 14182,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7677 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650378952.509, "dur": 2.360, "args": { "External id": 14183,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7678, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.21)", "pid": 1336757, "tid": 1336757, "ts": 1295650379083.407, "dur": 16805.671, "args": { "External id": 14184,"Record function id": 0, "Ev Idx": 7679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379184.387, "dur": 7.347, "args": { "External id": 14185,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379195.455, "dur": 1.482, "args": { "External id": 14186,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379198.499, "dur": 1.462, "args": { "External id": 14187,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379201.453, "dur": 1.242, "args": { "External id": 14188,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379203.975, "dur": 0.763, "args": { "External id": 14189,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379208.245, "dur": 1.156, "args": { "External id": 14190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379211.179, "dur": 1.311, "args": { "External id": 14191,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379213.947, "dur": 2.163, "args": { "External id": 14192,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379217.745, "dur": 1.172, "args": { "External id": 14193,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650379222.930, "dur": 0.818, "args": { "External id": 14194,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7689 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650379263.572, "dur": 16578.297, "args": { "External id": 14195,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650379283.642, "dur": 16550.365, "args": { "External id": 14196,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650379308.970, "dur": 16.968, "args": { "External id": 14197,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650379329.912, "dur": 16468.444, "args": { "External id": 14198,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650379333.184, "dur": 16464.525, "args": { "External id": 14199,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650379339.677, "dur": 7.100, "args": { "External id": 14200,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650379348.427, "dur": 16445.908, "args": { "External id": 14201,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7696 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650396058.777, "dur": 40.121, "args": { "External id": 14202,"Sequence number": 246583, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7697 } }, { "ph": "s", "id": 185, "pid": 1336757, "tid": 1336757, "ts": 1295650396058.777, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650396083.262, "dur": 10.451, "args": { "External id": 14203,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650396087.309, "dur": 6.038, "args": { "External id": 14204,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7699 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650396173.903, "dur": 101.611, "args": { "External id": 14205,"Record function id": 0, "Ev Idx": 7700 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650396279.653, "dur": 1153.304, "args": { "External id": 14206,"Record function id": 0, "Ev Idx": 7701 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650396326.199, "dur": 1091.560, "args": { "External id": 14207,"Sequence number": 246584, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7702 } }, { "ph": "s", "id": 184, "pid": 1336757, "tid": 1336757, "ts": 1295650396326.199, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650396399.601, "dur": 51.257, "args": { "External id": 14208,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650396465.518, "dur": 107.317, "args": { "External id": 14209,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650396582.414, "dur": 40.998, "args": { "External id": 14210,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650396632.774, "dur": 31.819, "args": { "External id": 14211,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7706 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650396690.438, "dur": 27.097, "args": { "External id": 14212,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7707 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650396734.929, "dur": 15.030, "args": { "External id": 14213,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7708 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650396767.697, "dur": 130.429, "args": { "External id": 14214,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650396817.858, "dur": 12.225, "args": { "External id": 14215,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650396822.830, "dur": 6.393, "args": { "External id": 14216,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650396833.183, "dur": 5.789, "args": { "External id": 14217,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650396840.228, "dur": 1.604, "args": { "External id": 14218,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650396844.754, "dur": 3.864, "args": { "External id": 14219,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650396908.924, "dur": 45.053, "args": { "External id": 14220,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7715 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650397023.113, "dur": 32.371, "args": { "External id": 14221,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650397066.890, "dur": 45.802, "args": { "External id": 14222,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650397122.661, "dur": 34.886, "args": { "External id": 14223,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7718 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650397182.383, "dur": 27.399, "args": { "External id": 14224,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650397216.724, "dur": 61.026, "args": { "External id": 14225,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650397309.661, "dur": 31.526, "args": { "External id": 14226,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7721 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.21)", "pid": 1336757, "tid": 1336757, "ts": 1295650397500.775, "dur": 76.017, "args": { "External id": 14227,"Record function id": 0, "Ev Idx": 7722 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650397648.000, "dur": 45.688, "args": { "External id": 14228,"Record function id": 0, "Ev Idx": 7723 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.22)", "pid": 1336757, "tid": 1336757, "ts": 1295650397702.868, "dur": 18135.312, "args": { "External id": 14229,"Record function id": 0, "Ev Idx": 7724 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.22)", "pid": 1336757, "tid": 1336757, "ts": 1295650397711.942, "dur": 936.552, "args": { "External id": 14230,"Record function id": 0, "Ev Idx": 7725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650397795.443, "dur": 9.259, "args": { "External id": 14231,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650397817.715, "dur": 37.227, "args": { "External id": 14232,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397823.013, "dur": 2.351, "args": { "External id": 14233,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397830.291, "dur": 0.838, "args": { "External id": 14234,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397832.262, "dur": 0.835, "args": { "External id": 14235,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397834.658, "dur": 0.789, "args": { "External id": 14236,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397838.363, "dur": 0.580, "args": { "External id": 14237,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397840.159, "dur": 0.524, "args": { "External id": 14238,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397841.892, "dur": 2.761, "args": { "External id": 14239,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397846.278, "dur": 0.521, "args": { "External id": 14240,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397848.176, "dur": 0.797, "args": { "External id": 14241,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650397865.606, "dur": 39.210, "args": { "External id": 14242,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7737 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650397936.369, "dur": 165.949, "args": { "External id": 14243,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650397947.247, "dur": 4.693, "args": { "External id": 14244,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650397957.027, "dur": 10.927, "args": { "External id": 14245,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650397961.501, "dur": 6.068, "args": { "External id": 14246,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397965.180, "dur": 0.977, "args": { "External id": 14247,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650397974.351, "dur": 78.041, "args": { "External id": 14248,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650397976.337, "dur": 3.048, "args": { "External id": 14249,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398020.109, "dur": 1.014, "args": { "External id": 14250,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398023.076, "dur": 0.933, "args": { "External id": 14251,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398028.254, "dur": 0.495, "args": { "External id": 14252,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398030.025, "dur": 0.547, "args": { "External id": 14253,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398031.996, "dur": 0.920, "args": { "External id": 14254,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398036.040, "dur": 0.745, "args": { "External id": 14255,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398038.952, "dur": 0.836, "args": { "External id": 14256,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398044.375, "dur": 2.938, "args": { "External id": 14257,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650398067.560, "dur": 26.072, "args": { "External id": 14258,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7753 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650398157.729, "dur": 381.884, "args": { "External id": 14259,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7754 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650398189.740, "dur": 344.053, "args": { "External id": 14260,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7755, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650398200.719, "dur": 326.578, "args": { "External id": 14261,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7756 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650398567.577, "dur": 3.121, "args": { "External id": 14262,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7757, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.22)", "pid": 1336757, "tid": 1336757, "ts": 1295650398671.152, "dur": 16957.808, "args": { "External id": 14263,"Record function id": 0, "Ev Idx": 7758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398773.313, "dur": 6.417, "args": { "External id": 14264,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398783.324, "dur": 1.718, "args": { "External id": 14265,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398786.919, "dur": 1.574, "args": { "External id": 14266,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398789.973, "dur": 1.126, "args": { "External id": 14267,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398792.742, "dur": 1.266, "args": { "External id": 14268,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398797.423, "dur": 0.956, "args": { "External id": 14269,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398799.904, "dur": 1.257, "args": { "External id": 14270,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398803.373, "dur": 2.507, "args": { "External id": 14271,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398807.418, "dur": 1.152, "args": { "External id": 14272,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650398812.059, "dur": 0.813, "args": { "External id": 14273,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7768 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650398830.253, "dur": 16750.504, "args": { "External id": 14274,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650398852.807, "dur": 16719.331, "args": { "External id": 14275,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650398872.263, "dur": 14.143, "args": { "External id": 14276,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650398889.282, "dur": 16646.438, "args": { "External id": 14277,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650398891.821, "dur": 16643.248, "args": { "External id": 14278,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650398898.240, "dur": 6.223, "args": { "External id": 14279,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650398906.188, "dur": 16625.142, "args": { "External id": 14280,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7775 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650415771.790, "dur": 38.742, "args": { "External id": 14281,"Sequence number": 246585, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7776 } }, { "ph": "s", "id": 183, "pid": 1336757, "tid": 1336757, "ts": 1295650415771.790, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650415795.518, "dur": 10.113, "args": { "External id": 14282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650415799.785, "dur": 5.599, "args": { "External id": 14283,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7778 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650415879.753, "dur": 77.270, "args": { "External id": 14284,"Record function id": 0, "Ev Idx": 7779 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650415958.705, "dur": 1165.818, "args": { "External id": 14285,"Record function id": 0, "Ev Idx": 7780 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650416031.894, "dur": 1077.803, "args": { "External id": 14286,"Sequence number": 246586, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7781 } }, { "ph": "s", "id": 182, "pid": 1336757, "tid": 1336757, "ts": 1295650416031.894, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650416100.952, "dur": 45.549, "args": { "External id": 14287,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650416160.801, "dur": 125.447, "args": { "External id": 14288,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650416303.544, "dur": 45.974, "args": { "External id": 14289,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650416359.758, "dur": 30.610, "args": { "External id": 14290,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7785 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650416420.383, "dur": 28.560, "args": { "External id": 14291,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7786 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650416468.414, "dur": 17.321, "args": { "External id": 14292,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7787 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650416504.951, "dur": 137.481, "args": { "External id": 14293,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650416560.216, "dur": 13.177, "args": { "External id": 14294,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650416565.655, "dur": 6.824, "args": { "External id": 14295,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650416576.187, "dur": 5.107, "args": { "External id": 14296,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650416582.698, "dur": 1.640, "args": { "External id": 14297,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650416586.734, "dur": 4.194, "args": { "External id": 14298,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650416653.077, "dur": 48.950, "args": { "External id": 14299,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7794 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650416735.214, "dur": 29.227, "args": { "External id": 14300,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650416772.658, "dur": 41.949, "args": { "External id": 14301,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650416824.034, "dur": 34.675, "args": { "External id": 14302,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7797 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650416883.457, "dur": 30.511, "args": { "External id": 14303,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650416920.415, "dur": 33.702, "args": { "External id": 14304,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7799 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650416974.604, "dur": 58.338, "args": { "External id": 14305,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7800 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.22)", "pid": 1336757, "tid": 1336757, "ts": 1295650417192.139, "dur": 110.535, "args": { "External id": 14306,"Record function id": 0, "Ev Idx": 7801 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650417393.190, "dur": 49.762, "args": { "External id": 14307,"Record function id": 0, "Ev Idx": 7802 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.23)", "pid": 1336757, "tid": 1336757, "ts": 1295650417452.551, "dur": 18040.601, "args": { "External id": 14308,"Record function id": 0, "Ev Idx": 7803 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.23)", "pid": 1336757, "tid": 1336757, "ts": 1295650417460.268, "dur": 971.127, "args": { "External id": 14309,"Record function id": 0, "Ev Idx": 7804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650417548.098, "dur": 11.724, "args": { "External id": 14310,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650417573.697, "dur": 40.002, "args": { "External id": 14311,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417579.410, "dur": 2.492, "args": { "External id": 14312,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417586.161, "dur": 0.798, "args": { "External id": 14313,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417588.749, "dur": 0.815, "args": { "External id": 14314,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417591.153, "dur": 0.813, "args": { "External id": 14315,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417596.305, "dur": 0.669, "args": { "External id": 14316,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417598.425, "dur": 0.798, "args": { "External id": 14317,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417600.921, "dur": 2.399, "args": { "External id": 14318,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417604.788, "dur": 0.632, "args": { "External id": 14319,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417607.201, "dur": 0.693, "args": { "External id": 14320,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650417624.803, "dur": 43.730, "args": { "External id": 14321,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7816 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650417702.217, "dur": 145.793, "args": { "External id": 14322,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650417713.318, "dur": 4.637, "args": { "External id": 14323,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650417723.064, "dur": 11.100, "args": { "External id": 14324,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650417727.853, "dur": 5.886, "args": { "External id": 14325,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417731.580, "dur": 0.941, "args": { "External id": 14326,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650417740.778, "dur": 31.897, "args": { "External id": 14327,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417742.822, "dur": 2.400, "args": { "External id": 14328,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417746.727, "dur": 0.768, "args": { "External id": 14329,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417748.936, "dur": 0.859, "args": { "External id": 14330,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417753.368, "dur": 0.658, "args": { "External id": 14331,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417756.168, "dur": 0.627, "args": { "External id": 14332,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417758.088, "dur": 0.979, "args": { "External id": 14333,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417762.263, "dur": 0.544, "args": { "External id": 14334,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417764.047, "dur": 0.808, "args": { "External id": 14335,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650417766.464, "dur": 2.348, "args": { "External id": 14336,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650417817.239, "dur": 22.518, "args": { "External id": 14337,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7832 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650417901.523, "dur": 413.488, "args": { "External id": 14338,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7833 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650417933.105, "dur": 376.068, "args": { "External id": 14339,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7834, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650417945.225, "dur": 355.565, "args": { "External id": 14340,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7835 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650418345.034, "dur": 3.696, "args": { "External id": 14341,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7836, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.23)", "pid": 1336757, "tid": 1336757, "ts": 1295650418453.180, "dur": 16809.262, "args": { "External id": 14342,"Record function id": 0, "Ev Idx": 7837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418556.439, "dur": 6.923, "args": { "External id": 14343,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418566.808, "dur": 1.363, "args": { "External id": 14344,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418569.885, "dur": 1.273, "args": { "External id": 14345,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418572.706, "dur": 1.295, "args": { "External id": 14346,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418575.403, "dur": 1.046, "args": { "External id": 14347,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418580.220, "dur": 0.915, "args": { "External id": 14348,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418582.896, "dur": 0.882, "args": { "External id": 14349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418585.093, "dur": 2.439, "args": { "External id": 14350,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418589.069, "dur": 1.365, "args": { "External id": 14351,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650418593.725, "dur": 1.183, "args": { "External id": 14352,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7847 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650418614.000, "dur": 16584.858, "args": { "External id": 14353,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650418629.980, "dur": 16560.490, "args": { "External id": 14354,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650418654.265, "dur": 15.012, "args": { "External id": 14355,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650418672.237, "dur": 16481.406, "args": { "External id": 14356,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650418674.667, "dur": 16478.226, "args": { "External id": 14357,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650418680.799, "dur": 5.790, "args": { "External id": 14358,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650418688.452, "dur": 16460.878, "args": { "External id": 14359,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7854 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650435421.966, "dur": 42.403, "args": { "External id": 14360,"Sequence number": 246587, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7855 } }, { "ph": "s", "id": 181, "pid": 1336757, "tid": 1336757, "ts": 1295650435421.966, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650435449.220, "dur": 10.113, "args": { "External id": 14361,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650435453.157, "dur": 5.886, "args": { "External id": 14362,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7857 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650435532.890, "dur": 78.505, "args": { "External id": 14363,"Record function id": 0, "Ev Idx": 7858 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650435613.141, "dur": 1133.881, "args": { "External id": 14364,"Record function id": 0, "Ev Idx": 7859 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650435654.842, "dur": 1078.512, "args": { "External id": 14365,"Sequence number": 246588, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7860 } }, { "ph": "s", "id": 180, "pid": 1336757, "tid": 1336757, "ts": 1295650435654.842, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650435722.855, "dur": 45.995, "args": { "External id": 14366,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650435782.383, "dur": 104.183, "args": { "External id": 14367,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650435895.982, "dur": 37.834, "args": { "External id": 14368,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650435943.406, "dur": 31.184, "args": { "External id": 14369,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7864 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650436040.969, "dur": 29.038, "args": { "External id": 14370,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7865 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650436089.617, "dur": 16.303, "args": { "External id": 14371,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7866 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650436125.416, "dur": 157.853, "args": { "External id": 14372,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650436178.814, "dur": 13.437, "args": { "External id": 14373,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650436184.246, "dur": 7.140, "args": { "External id": 14374,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650436194.935, "dur": 5.289, "args": { "External id": 14375,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650436201.475, "dur": 1.354, "args": { "External id": 14376,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650436205.562, "dur": 3.684, "args": { "External id": 14377,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650436298.284, "dur": 63.183, "args": { "External id": 14378,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7873 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650436396.238, "dur": 30.850, "args": { "External id": 14379,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650436436.266, "dur": 42.936, "args": { "External id": 14380,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650436489.076, "dur": 34.933, "args": { "External id": 14381,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7876 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650436548.904, "dur": 26.847, "args": { "External id": 14382,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650436581.847, "dur": 34.737, "args": { "External id": 14383,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7878 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650436637.110, "dur": 21.525, "args": { "External id": 14384,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7879 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.23)", "pid": 1336757, "tid": 1336757, "ts": 1295650436812.164, "dur": 79.750, "args": { "External id": 14385,"Record function id": 0, "Ev Idx": 7880 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650436965.061, "dur": 88.232, "args": { "External id": 14386,"Record function id": 0, "Ev Idx": 7881 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.24)", "pid": 1336757, "tid": 1336757, "ts": 1295650437064.723, "dur": 18241.787, "args": { "External id": 14387,"Record function id": 0, "Ev Idx": 7882 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.24)", "pid": 1336757, "tid": 1336757, "ts": 1295650437074.177, "dur": 901.145, "args": { "External id": 14388,"Record function id": 0, "Ev Idx": 7883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650437157.860, "dur": 9.776, "args": { "External id": 14389,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650437181.123, "dur": 38.591, "args": { "External id": 14390,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437186.800, "dur": 2.269, "args": { "External id": 14391,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437194.096, "dur": 0.727, "args": { "External id": 14392,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437195.976, "dur": 0.818, "args": { "External id": 14393,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437198.371, "dur": 0.884, "args": { "External id": 14394,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437202.726, "dur": 0.636, "args": { "External id": 14395,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437204.969, "dur": 0.977, "args": { "External id": 14396,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437206.729, "dur": 2.690, "args": { "External id": 14397,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437211.128, "dur": 0.600, "args": { "External id": 14398,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437212.975, "dur": 0.741, "args": { "External id": 14399,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650437247.332, "dur": 52.224, "args": { "External id": 14400,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7895 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650437346.737, "dur": 124.883, "args": { "External id": 14401,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650437359.106, "dur": 7.371, "args": { "External id": 14402,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650437371.648, "dur": 12.014, "args": { "External id": 14403,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650437376.509, "dur": 6.749, "args": { "External id": 14404,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437380.531, "dur": 0.856, "args": { "External id": 14405,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650437391.319, "dur": 31.930, "args": { "External id": 14406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437393.343, "dur": 2.506, "args": { "External id": 14407,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437397.921, "dur": 0.704, "args": { "External id": 14408,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437399.919, "dur": 0.692, "args": { "External id": 14409,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437404.316, "dur": 0.716, "args": { "External id": 14410,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437406.133, "dur": 0.569, "args": { "External id": 14411,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437408.694, "dur": 0.667, "args": { "External id": 14412,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437412.383, "dur": 0.706, "args": { "External id": 14413,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437414.401, "dur": 0.856, "args": { "External id": 14414,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650437416.269, "dur": 2.719, "args": { "External id": 14415,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650437438.196, "dur": 24.792, "args": { "External id": 14416,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7911 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650437528.832, "dur": 353.478, "args": { "External id": 14417,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7912 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650437566.806, "dur": 310.520, "args": { "External id": 14418,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7913, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650437577.010, "dur": 294.564, "args": { "External id": 14419,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7914 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650437904.971, "dur": 2.216, "args": { "External id": 14420,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7915, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.24)", "pid": 1336757, "tid": 1336757, "ts": 1295650438037.466, "dur": 17028.928, "args": { "External id": 14421,"Record function id": 0, "Ev Idx": 7916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438143.998, "dur": 6.843, "args": { "External id": 14422,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438160.014, "dur": 1.580, "args": { "External id": 14423,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438163.534, "dur": 1.249, "args": { "External id": 14424,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438168.412, "dur": 1.132, "args": { "External id": 14425,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438170.752, "dur": 1.448, "args": { "External id": 14426,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438173.347, "dur": 0.940, "args": { "External id": 14427,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438175.633, "dur": 1.159, "args": { "External id": 14428,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438180.507, "dur": 1.973, "args": { "External id": 14429,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438183.903, "dur": 1.076, "args": { "External id": 14430,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650438186.699, "dur": 0.702, "args": { "External id": 14431,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7926 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650438208.321, "dur": 16807.912, "args": { "External id": 14432,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650438223.959, "dur": 16783.622, "args": { "External id": 14433,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650438265.033, "dur": 17.074, "args": { "External id": 14434,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650438289.107, "dur": 16659.221, "args": { "External id": 14435,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650438291.915, "dur": 16655.676, "args": { "External id": 14436,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650438299.346, "dur": 8.448, "args": { "External id": 14437,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650438310.040, "dur": 16634.251, "args": { "External id": 14438,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7933 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650455212.629, "dur": 58.284, "args": { "External id": 14439,"Sequence number": 246589, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7934 } }, { "ph": "s", "id": 179, "pid": 1336757, "tid": 1336757, "ts": 1295650455212.629, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650455244.408, "dur": 19.718, "args": { "External id": 14440,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650455256.282, "dur": 7.099, "args": { "External id": 14441,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7936 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650455346.172, "dur": 80.883, "args": { "External id": 14442,"Record function id": 0, "Ev Idx": 7937 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650455428.586, "dur": 1164.331, "args": { "External id": 14443,"Record function id": 0, "Ev Idx": 7938 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650455468.638, "dur": 1109.347, "args": { "External id": 14444,"Sequence number": 246590, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7939 } }, { "ph": "s", "id": 178, "pid": 1336757, "tid": 1336757, "ts": 1295650455468.638, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650455542.526, "dur": 47.205, "args": { "External id": 14445,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650455604.122, "dur": 105.490, "args": { "External id": 14446,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650455719.031, "dur": 39.515, "args": { "External id": 14447,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650455767.431, "dur": 31.159, "args": { "External id": 14448,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7943 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650455825.600, "dur": 27.416, "args": { "External id": 14449,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7944 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650455872.019, "dur": 19.353, "args": { "External id": 14450,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7945 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650455909.017, "dur": 176.997, "args": { "External id": 14451,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650455961.328, "dur": 12.056, "args": { "External id": 14452,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650455965.961, "dur": 6.633, "args": { "External id": 14453,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650455975.940, "dur": 4.901, "args": { "External id": 14454,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650456020.347, "dur": 2.915, "args": { "External id": 14455,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650456026.595, "dur": 3.881, "args": { "External id": 14456,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650456097.847, "dur": 53.370, "args": { "External id": 14457,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7952 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650456185.352, "dur": 30.057, "args": { "External id": 14458,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650456224.261, "dur": 79.887, "args": { "External id": 14459,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650456318.830, "dur": 37.392, "args": { "External id": 14460,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7955 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650456393.074, "dur": 29.720, "args": { "External id": 14461,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650456431.753, "dur": 38.066, "args": { "External id": 14462,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7957 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650456490.241, "dur": 17.777, "args": { "External id": 14463,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7958 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.24)", "pid": 1336757, "tid": 1336757, "ts": 1295650456662.004, "dur": 80.256, "args": { "External id": 14464,"Record function id": 0, "Ev Idx": 7959 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650456816.835, "dur": 47.959, "args": { "External id": 14465,"Record function id": 0, "Ev Idx": 7960 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.25)", "pid": 1336757, "tid": 1336757, "ts": 1295650456874.631, "dur": 18036.028, "args": { "External id": 14466,"Record function id": 0, "Ev Idx": 7961 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.25)", "pid": 1336757, "tid": 1336757, "ts": 1295650456883.908, "dur": 974.223, "args": { "External id": 14467,"Record function id": 0, "Ev Idx": 7962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650456963.904, "dur": 10.151, "args": { "External id": 14468,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650457032.081, "dur": 38.469, "args": { "External id": 14469,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457037.644, "dur": 2.569, "args": { "External id": 14470,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457045.047, "dur": 0.777, "args": { "External id": 14471,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457047.414, "dur": 0.438, "args": { "External id": 14472,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457049.264, "dur": 0.606, "args": { "External id": 14473,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457053.196, "dur": 0.788, "args": { "External id": 14474,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457055.578, "dur": 0.875, "args": { "External id": 14475,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457057.420, "dur": 2.728, "args": { "External id": 14476,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457061.598, "dur": 0.987, "args": { "External id": 14477,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457063.879, "dur": 0.765, "args": { "External id": 14478,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650457082.358, "dur": 43.211, "args": { "External id": 14479,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7974 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650457160.460, "dur": 156.498, "args": { "External id": 14480,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650457172.268, "dur": 5.852, "args": { "External id": 14481,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650457182.974, "dur": 11.279, "args": { "External id": 14482,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650457187.567, "dur": 6.267, "args": { "External id": 14483,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457191.572, "dur": 0.987, "args": { "External id": 14484,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650457201.640, "dur": 49.862, "args": { "External id": 14485,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457203.801, "dur": 2.946, "args": { "External id": 14486,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457208.413, "dur": 0.683, "args": { "External id": 14487,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457209.949, "dur": 1.055, "args": { "External id": 14488,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457214.831, "dur": 0.793, "args": { "External id": 14489,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457216.636, "dur": 0.784, "args": { "External id": 14490,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457219.138, "dur": 0.740, "args": { "External id": 14491,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457222.296, "dur": 0.980, "args": { "External id": 14492,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457224.578, "dur": 0.935, "args": { "External id": 14493,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650457226.771, "dur": 18.511, "args": { "External id": 14494,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650457272.928, "dur": 32.939, "args": { "External id": 14495,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7990 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650457380.381, "dur": 384.882, "args": { "External id": 14496,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7991 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650457412.670, "dur": 347.834, "args": { "External id": 14497,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7992, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650457423.681, "dur": 331.153, "args": { "External id": 14498,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7993 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650457787.378, "dur": 2.471, "args": { "External id": 14499,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7994, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.25)", "pid": 1336757, "tid": 1336757, "ts": 1295650457880.195, "dur": 16821.074, "args": { "External id": 14500,"Record function id": 0, "Ev Idx": 7995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650457983.494, "dur": 44.958, "args": { "External id": 14501,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458034.691, "dur": 1.714, "args": { "External id": 14502,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458038.357, "dur": 1.224, "args": { "External id": 14503,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458041.669, "dur": 1.238, "args": { "External id": 14504,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458044.304, "dur": 1.130, "args": { "External id": 14505,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458046.603, "dur": 1.067, "args": { "External id": 14506,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458051.576, "dur": 1.036, "args": { "External id": 14507,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458054.260, "dur": 1.881, "args": { "External id": 14508,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458058.005, "dur": 0.876, "args": { "External id": 14509,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650458060.146, "dur": 0.928, "args": { "External id": 14510,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8005 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650458083.962, "dur": 16572.409, "args": { "External id": 14511,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650458100.998, "dur": 16547.763, "args": { "External id": 14512,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650458126.545, "dur": 15.702, "args": { "External id": 14513,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650458145.187, "dur": 16467.341, "args": { "External id": 14514,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650458148.093, "dur": 16463.751, "args": { "External id": 14515,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650458154.292, "dur": 6.207, "args": { "External id": 14516,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650458162.283, "dur": 16446.120, "args": { "External id": 14517,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8012 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650474845.443, "dur": 40.376, "args": { "External id": 14518,"Sequence number": 246591, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8013 } }, { "ph": "s", "id": 177, "pid": 1336757, "tid": 1336757, "ts": 1295650474845.443, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650474870.531, "dur": 10.032, "args": { "External id": 14519,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650474874.799, "dur": 5.507, "args": { "External id": 14520,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8015 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650474950.618, "dur": 110.273, "args": { "External id": 14521,"Record function id": 0, "Ev Idx": 8016 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650475064.522, "dur": 1135.218, "args": { "External id": 14522,"Record function id": 0, "Ev Idx": 8017 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650475106.458, "dur": 1078.890, "args": { "External id": 14523,"Sequence number": 246592, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8018 } }, { "ph": "s", "id": 176, "pid": 1336757, "tid": 1336757, "ts": 1295650475106.458, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650475182.177, "dur": 62.304, "args": { "External id": 14524,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650475266.397, "dur": 103.743, "args": { "External id": 14525,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650475380.494, "dur": 39.577, "args": { "External id": 14526,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650475429.818, "dur": 30.223, "args": { "External id": 14527,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8022 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650475489.820, "dur": 29.475, "args": { "External id": 14528,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8023 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650475539.898, "dur": 16.303, "args": { "External id": 14529,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8024 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650475575.674, "dur": 132.579, "args": { "External id": 14530,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650475628.408, "dur": 12.752, "args": { "External id": 14531,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650475633.853, "dur": 6.461, "args": { "External id": 14532,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650475643.882, "dur": 5.264, "args": { "External id": 14533,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650475650.273, "dur": 1.491, "args": { "External id": 14534,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650475654.029, "dur": 3.659, "args": { "External id": 14535,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650475719.000, "dur": 45.226, "args": { "External id": 14536,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8031 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650475794.645, "dur": 30.519, "args": { "External id": 14537,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650475833.514, "dur": 40.244, "args": { "External id": 14538,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650475882.924, "dur": 34.791, "args": { "External id": 14539,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8034 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650475942.272, "dur": 36.452, "args": { "External id": 14540,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650476021.727, "dur": 41.592, "args": { "External id": 14541,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8036 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650476087.823, "dur": 23.702, "args": { "External id": 14542,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8037 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.25)", "pid": 1336757, "tid": 1336757, "ts": 1295650476292.121, "dur": 83.484, "args": { "External id": 14543,"Record function id": 0, "Ev Idx": 8038 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650476451.406, "dur": 46.224, "args": { "External id": 14544,"Record function id": 0, "Ev Idx": 8039 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.26)", "pid": 1336757, "tid": 1336757, "ts": 1295650476506.896, "dur": 18065.122, "args": { "External id": 14545,"Record function id": 0, "Ev Idx": 8040 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.26)", "pid": 1336757, "tid": 1336757, "ts": 1295650476514.589, "dur": 952.860, "args": { "External id": 14546,"Record function id": 0, "Ev Idx": 8041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650476602.574, "dur": 10.634, "args": { "External id": 14547,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650476626.059, "dur": 39.250, "args": { "External id": 14548,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476631.850, "dur": 2.425, "args": { "External id": 14549,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476638.890, "dur": 0.987, "args": { "External id": 14550,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476641.693, "dur": 0.828, "args": { "External id": 14551,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476643.759, "dur": 0.779, "args": { "External id": 14552,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476648.465, "dur": 0.691, "args": { "External id": 14553,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476650.432, "dur": 0.622, "args": { "External id": 14554,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476652.598, "dur": 2.701, "args": { "External id": 14555,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476656.296, "dur": 0.646, "args": { "External id": 14556,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476658.408, "dur": 0.776, "args": { "External id": 14557,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650476677.368, "dur": 45.848, "args": { "External id": 14558,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8053 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650476756.860, "dur": 121.067, "args": { "External id": 14559,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 8054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650476768.207, "dur": 5.327, "args": { "External id": 14560,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650476778.667, "dur": 11.060, "args": { "External id": 14561,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650476783.235, "dur": 6.103, "args": { "External id": 14562,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 8057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476787.032, "dur": 1.099, "args": { "External id": 14563,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650476795.999, "dur": 37.745, "args": { "External id": 14564,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476798.084, "dur": 2.314, "args": { "External id": 14565,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476801.698, "dur": 0.975, "args": { "External id": 14566,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476808.202, "dur": 0.897, "args": { "External id": 14567,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476812.541, "dur": 0.873, "args": { "External id": 14568,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476815.036, "dur": 0.702, "args": { "External id": 14569,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476817.303, "dur": 2.692, "args": { "External id": 14570,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476821.833, "dur": 0.826, "args": { "External id": 14571,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476823.662, "dur": 0.993, "args": { "External id": 14572,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650476828.664, "dur": 0.969, "args": { "External id": 14573,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650476846.928, "dur": 23.158, "args": { "External id": 14574,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8069 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650476931.433, "dur": 429.278, "args": { "External id": 14575,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 8070 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650476963.315, "dur": 390.861, "args": { "External id": 14576,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 8071, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650476973.796, "dur": 373.212, "args": { "External id": 14577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 8072 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650477389.330, "dur": 2.577, "args": { "External id": 14578,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 8073, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.26)", "pid": 1336757, "tid": 1336757, "ts": 1295650477487.753, "dur": 16881.499, "args": { "External id": 14579,"Record function id": 0, "Ev Idx": 8074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477589.239, "dur": 6.735, "args": { "External id": 14580,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 8075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477599.111, "dur": 1.471, "args": { "External id": 14581,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477609.009, "dur": 1.188, "args": { "External id": 14582,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477613.641, "dur": 1.253, "args": { "External id": 14583,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477616.261, "dur": 1.033, "args": { "External id": 14584,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477618.664, "dur": 1.320, "args": { "External id": 14585,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477621.774, "dur": 1.109, "args": { "External id": 14586,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477626.187, "dur": 2.025, "args": { "External id": 14587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477629.970, "dur": 1.382, "args": { "External id": 14588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650477632.694, "dur": 0.936, "args": { "External id": 14589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8084 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650477654.111, "dur": 16672.061, "args": { "External id": 14590,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650477670.735, "dur": 16647.186, "args": { "External id": 14591,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650477691.446, "dur": 14.063, "args": { "External id": 14592,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650477710.713, "dur": 16568.608, "args": { "External id": 14593,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650477713.422, "dur": 16564.974, "args": { "External id": 14594,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650477719.345, "dur": 5.887, "args": { "External id": 14595,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650477727.260, "dur": 16547.905, "args": { "External id": 14596,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8091 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650494509.230, "dur": 38.108, "args": { "External id": 14597,"Sequence number": 246593, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8092 } }, { "ph": "s", "id": 175, "pid": 1336757, "tid": 1336757, "ts": 1295650494509.230, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650494532.898, "dur": 9.651, "args": { "External id": 14598,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650494536.763, "dur": 5.585, "args": { "External id": 14599,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8094 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650494610.239, "dur": 81.114, "args": { "External id": 14600,"Record function id": 0, "Ev Idx": 8095 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650494692.762, "dur": 1149.825, "args": { "External id": 14601,"Record function id": 0, "Ev Idx": 8096 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650494732.544, "dur": 1095.256, "args": { "External id": 14602,"Sequence number": 246594, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8097 } }, { "ph": "s", "id": 174, "pid": 1336757, "tid": 1336757, "ts": 1295650494732.544, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650494802.669, "dur": 43.742, "args": { "External id": 14603,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650494860.282, "dur": 105.940, "args": { "External id": 14604,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650494976.050, "dur": 80.995, "args": { "External id": 14605,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650495070.218, "dur": 33.187, "args": { "External id": 14606,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8101 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650495130.558, "dur": 31.380, "args": { "External id": 14607,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8102 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650495182.643, "dur": 16.908, "args": { "External id": 14608,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8103 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650495218.607, "dur": 174.488, "args": { "External id": 14609,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650495299.180, "dur": 17.172, "args": { "External id": 14610,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650495305.434, "dur": 9.548, "args": { "External id": 14611,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650495319.924, "dur": 7.070, "args": { "External id": 14612,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650495328.950, "dur": 2.140, "args": { "External id": 14613,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650495333.360, "dur": 4.363, "args": { "External id": 14614,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650495404.760, "dur": 54.496, "args": { "External id": 14615,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8110 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650495492.561, "dur": 29.745, "args": { "External id": 14616,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650495530.488, "dur": 42.138, "args": { "External id": 14617,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650495582.295, "dur": 35.520, "args": { "External id": 14618,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8113 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650495640.138, "dur": 27.902, "args": { "External id": 14619,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650495674.516, "dur": 36.742, "args": { "External id": 14620,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8115 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650495733.709, "dur": 19.687, "args": { "External id": 14621,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8116 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.26)", "pid": 1336757, "tid": 1336757, "ts": 1295650495908.584, "dur": 115.498, "args": { "External id": 14622,"Record function id": 0, "Ev Idx": 8117 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336757, "tid": 1336757, "ts": 1295650496105.189, "dur": 48.253, "args": { "External id": 14623,"Record function id": 0, "Ev Idx": 8118 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.27)", "pid": 1336757, "tid": 1336757, "ts": 1295650496163.310, "dur": 17973.637, "args": { "External id": 14624,"Record function id": 0, "Ev Idx": 8119 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.27)", "pid": 1336757, "tid": 1336757, "ts": 1295650496172.026, "dur": 947.232, "args": { "External id": 14625,"Record function id": 0, "Ev Idx": 8120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650496285.369, "dur": 12.851, "args": { "External id": 14626,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650496314.645, "dur": 48.735, "args": { "External id": 14627,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496320.699, "dur": 2.742, "args": { "External id": 14628,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496328.382, "dur": 0.692, "args": { "External id": 14629,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496330.520, "dur": 0.708, "args": { "External id": 14630,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496332.660, "dur": 0.654, "args": { "External id": 14631,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496336.980, "dur": 0.763, "args": { "External id": 14632,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496339.180, "dur": 0.895, "args": { "External id": 14633,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496341.339, "dur": 2.892, "args": { "External id": 14634,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496345.659, "dur": 0.849, "args": { "External id": 14635,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496347.756, "dur": 0.916, "args": { "External id": 14636,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650496377.350, "dur": 45.972, "args": { "External id": 14637,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8132 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336757, "tid": 1336757, "ts": 1295650496460.177, "dur": 118.649, "args": { "External id": 14638,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "4", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 8133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650496472.294, "dur": 5.764, "args": { "External id": 14639,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336757, "tid": 1336757, "ts": 1295650496483.435, "dur": 10.562, "args": { "External id": 14640,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650496487.953, "dur": 5.656, "args": { "External id": 14641,"Record function id": 0, "Concrete Inputs": ["", "0", "25692160", "32115200", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 8136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496491.469, "dur": 0.950, "args": { "External id": 14642,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336757, "tid": 1336757, "ts": 1295650496501.271, "dur": 31.591, "args": { "External id": 14643,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496503.229, "dur": 3.011, "args": { "External id": 14644,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "25692160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496507.776, "dur": 0.741, "args": { "External id": 14645,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "25692416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496510.288, "dur": 0.863, "args": { "External id": 14646,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26216704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496514.461, "dur": 0.761, "args": { "External id": 14647,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "26740992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496516.840, "dur": 0.529, "args": { "External id": 14648,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27265280"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496518.505, "dur": 0.575, "args": { "External id": 14649,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27789568"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496522.770, "dur": 0.643, "args": { "External id": 14650,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "27789824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496524.733, "dur": 0.680, "args": { "External id": 14651,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29231616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650496526.740, "dur": 2.589, "args": { "External id": 14652,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "30673408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650496548.505, "dur": 22.162, "args": { "External id": 14653,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8148 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336757, "tid": 1336757, "ts": 1295650496635.268, "dur": 381.161, "args": { "External id": 14654,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 8149 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650496667.822, "dur": 309.514, "args": { "External id": 14655,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 4, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 8150, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336757, "tid": 1336757, "ts": 1295650496678.454, "dur": 293.123, "args": { "External id": 14656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 8151 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295650497043.404, "dur": 3.133, "args": { "External id": 14657,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 8152, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.27)", "pid": 1336757, "tid": 1336757, "ts": 1295650497140.451, "dur": 16750.667, "args": { "External id": 14658,"Record function id": 0, "Ev Idx": 8153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497282.670, "dur": 7.371, "args": { "External id": 14659,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 8154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497295.658, "dur": 2.111, "args": { "External id": 14660,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497300.531, "dur": 1.641, "args": { "External id": 14661,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497306.546, "dur": 1.510, "args": { "External id": 14662,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497310.862, "dur": 1.548, "args": { "External id": 14663,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497314.685, "dur": 1.742, "args": { "External id": 14664,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497318.924, "dur": 1.000, "args": { "External id": 14665,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497324.877, "dur": 2.256, "args": { "External id": 14666,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497329.344, "dur": 1.263, "args": { "External id": 14667,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650497333.623, "dur": 1.193, "args": { "External id": 14668,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8163 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650497360.922, "dur": 16479.975, "args": { "External id": 14669,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650497381.207, "dur": 16450.934, "args": { "External id": 14670,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650497405.148, "dur": 16.829, "args": { "External id": 14671,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650497428.215, "dur": 16367.415, "args": { "External id": 14672,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650497431.239, "dur": 16363.571, "args": { "External id": 14673,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650497438.743, "dur": 8.154, "args": { "External id": 14674,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650497449.114, "dur": 16341.926, "args": { "External id": 14675,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8170 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650514065.918, "dur": 43.219, "args": { "External id": 14676,"Sequence number": 246595, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8171 } }, { "ph": "s", "id": 173, "pid": 1336757, "tid": 1336757, "ts": 1295650514065.918, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295650514085.628, "dur": 18.095, "args": { "External id": 14677,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650514096.965, "dur": 6.380, "args": { "External id": 14678,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8173 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650514178.999, "dur": 102.030, "args": { "External id": 14679,"Record function id": 0, "Ev Idx": 8174 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336757, "tid": 1336757, "ts": 1295650514285.307, "dur": 1161.443, "args": { "External id": 14680,"Record function id": 0, "Ev Idx": 8175 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650514335.272, "dur": 1096.746, "args": { "External id": 14681,"Sequence number": 246596, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8176 } }, { "ph": "s", "id": 172, "pid": 1336757, "tid": 1336757, "ts": 1295650514335.272, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650514410.320, "dur": 50.578, "args": { "External id": 14682,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650514475.087, "dur": 109.077, "args": { "External id": 14683,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650514593.477, "dur": 38.822, "args": { "External id": 14684,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650514642.080, "dur": 31.903, "args": { "External id": 14685,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8180 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650514697.430, "dur": 27.770, "args": { "External id": 14686,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8181 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336757, "tid": 1336757, "ts": 1295650514746.049, "dur": 15.662, "args": { "External id": 14687,"kernel_hash": "ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/td/ctde6obw47lrxarntg442rinsuwlx4v7ftjlbooqhkhlhwhaksb4.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8182 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650514779.768, "dur": 129.083, "args": { "External id": 14688,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650514830.780, "dur": 12.229, "args": { "External id": 14689,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650514835.808, "dur": 6.331, "args": { "External id": 14690,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650514845.844, "dur": 4.818, "args": { "External id": 14691,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650514851.982, "dur": 2.206, "args": { "External id": 14692,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650514856.493, "dur": 3.242, "args": { "External id": 14693,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650514919.514, "dur": 44.180, "args": { "External id": 14694,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8189 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336757, "tid": 1336757, "ts": 1295650515035.236, "dur": 33.294, "args": { "External id": 14695,"kernel_hash": "cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/oh/cohoteac6vn6qlofk3ytbewriosbrre4g473qjud7syi7ayj7ymc.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650515079.698, "dur": 45.611, "args": { "External id": 14696,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650515135.040, "dur": 35.527, "args": { "External id": 14697,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8192 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336757, "tid": 1336757, "ts": 1295650515194.353, "dur": 27.148, "args": { "External id": 14698,"kernel_hash": "cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/qh/cqhqx2lwkkgnxczi2z4ew2shsidevhbk5pjz54fm6sbd6uftsmjf.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650515242.557, "dur": 51.478, "args": { "External id": 14699,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8194 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336757, "tid": 1336757, "ts": 1295650515326.627, "dur": 26.395, "args": { "External id": 14700,"kernel_hash": "cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/qo/cqo6qtnieavgrnue4llkfxac3bydsk5p7r22potmkpxvtg3jxrsu.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8195 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.27)", "pid": 1336757, "tid": 1336757, "ts": 1295650515516.869, "dur": 32.872, "args": { "External id": 14701,"Record function id": 0, "Ev Idx": 8196 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650515693.113, "dur": 284.713, "args": { "External id": 14702,"Sequence number": 246597, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8197 } }, { "ph": "s", "id": 171, "pid": 1336757, "tid": 1336757, "ts": 1295650515693.113, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650515725.100, "dur": 8.695, "args": { "External id": 14703,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650515727.292, "dur": 6.248, "args": { "External id": 14704,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650515745.238, "dur": 14.357, "args": { "External id": 14705,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650515748.889, "dur": 10.033, "args": { "External id": 14706,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650515769.420, "dur": 5.556, "args": { "External id": 14707,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650515957.721, "dur": 6.833, "args": { "External id": 14708,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650515961.431, "dur": 2.900, "args": { "External id": 14709,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650516047.350, "dur": 154.924, "args": { "External id": 14710,"Sequence number": 246598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650516050.995, "dur": 18.352, "args": { "External id": 14711,"Sequence number": 246598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8206 } }, { "ph": "s", "id": 170, "pid": 1336757, "tid": 1336757, "ts": 1295650516050.995, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650516057.529, "dur": 9.526, "args": { "External id": 14712,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650516064.109, "dur": 2.444, "args": { "External id": 14713,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650516071.735, "dur": 130.115, "args": { "External id": 14714,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650516075.013, "dur": 5.651, "args": { "External id": 14715,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650516076.103, "dur": 4.428, "args": { "External id": 14716,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8211 } }, { "ph": "s", "id": 169, "pid": 1336757, "tid": 1336757, "ts": 1295650516076.103, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650516085.186, "dur": 106.199, "args": { "External id": 14717,"Sequence number": 246600, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8212 } }, { "ph": "s", "id": 168, "pid": 1336757, "tid": 1336757, "ts": 1295650516085.186, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650516195.241, "dur": 5.510, "args": { "External id": 14718,"Sequence number": 246601, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8213 } }, { "ph": "s", "id": 167, "pid": 1336757, "tid": 1336757, "ts": 1295650516195.241, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650516212.576, "dur": 113.999, "args": { "External id": 14719,"Sequence number": 246602, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650516213.667, "dur": 8.841, "args": { "External id": 14720,"Sequence number": 246602, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8215 } }, { "ph": "s", "id": 166, "pid": 1336757, "tid": 1336757, "ts": 1295650516213.667, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650516215.736, "dur": 5.333, "args": { "External id": 14721,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650516219.919, "dur": 0.947, "args": { "External id": 14722,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650516223.071, "dur": 103.258, "args": { "External id": 14723,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650516224.176, "dur": 23.639, "args": { "External id": 14724,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650516225.418, "dur": 21.618, "args": { "External id": 14725,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8220 } }, { "ph": "s", "id": 165, "pid": 1336757, "tid": 1336757, "ts": 1295650516225.418, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650516249.499, "dur": 68.191, "args": { "External id": 14726,"Sequence number": 246604, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8221 } }, { "ph": "s", "id": 164, "pid": 1336757, "tid": 1336757, "ts": 1295650516249.499, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650516319.898, "dur": 5.738, "args": { "External id": 14727,"Sequence number": 246605, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8222 } }, { "ph": "s", "id": 163, "pid": 1336757, "tid": 1336757, "ts": 1295650516319.898, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650516338.030, "dur": 73.694, "args": { "External id": 14728,"Sequence number": 246606, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650516339.095, "dur": 6.802, "args": { "External id": 14729,"Sequence number": 246606, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8224 } }, { "ph": "s", "id": 162, "pid": 1336757, "tid": 1336757, "ts": 1295650516339.095, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650516341.933, "dur": 2.834, "args": { "External id": 14730,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650516343.514, "dur": 0.879, "args": { "External id": 14731,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650516349.080, "dur": 62.435, "args": { "External id": 14732,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650516350.597, "dur": 5.381, "args": { "External id": 14733,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650516351.749, "dur": 4.076, "args": { "External id": 14734,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8229 } }, { "ph": "s", "id": 161, "pid": 1336757, "tid": 1336757, "ts": 1295650516351.749, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650516356.582, "dur": 45.478, "args": { "External id": 14735,"Sequence number": 246608, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8230 } }, { "ph": "s", "id": 160, "pid": 1336757, "tid": 1336757, "ts": 1295650516356.582, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650516403.843, "dur": 7.245, "args": { "External id": 14736,"Sequence number": 246609, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8231 } }, { "ph": "s", "id": 159, "pid": 1336757, "tid": 1336757, "ts": 1295650516403.843, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650516435.852, "dur": 4.820, "args": { "External id": 14737,"Sequence number": 246610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650516437.010, "dur": 3.489, "args": { "External id": 14738,"Sequence number": 246610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8233 } }, { "ph": "s", "id": 158, "pid": 1336757, "tid": 1336757, "ts": 1295650516437.010, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650516448.083, "dur": 3.798, "args": { "External id": 14739,"Sequence number": 246611, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650516449.640, "dur": 2.122, "args": { "External id": 14740,"Sequence number": 246611, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8235 } }, { "ph": "s", "id": 157, "pid": 1336757, "tid": 1336757, "ts": 1295650516449.640, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650516457.871, "dur": 5.803, "args": { "External id": 14741,"Sequence number": 246612, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650516459.274, "dur": 4.250, "args": { "External id": 14742,"Sequence number": 246612, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8237 } }, { "ph": "s", "id": 156, "pid": 1336757, "tid": 1336757, "ts": 1295650516459.274, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650516502.627, "dur": 190.985, "args": { "External id": 14743,"Sequence number": 246613, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8238 } }, { "ph": "s", "id": 155, "pid": 1336757, "tid": 1336757, "ts": 1295650516502.627, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650516528.620, "dur": 10.334, "args": { "External id": 14744,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650516532.329, "dur": 6.089, "args": { "External id": 14745,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8240 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650516706.467, "dur": 116.709, "args": { "External id": 14746,"Sequence number": 246614, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8241 } }, { "ph": "s", "id": 154, "pid": 1336757, "tid": 1336757, "ts": 1295650516706.467, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650516722.269, "dur": 8.036, "args": { "External id": 14747,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650516724.561, "dur": 5.319, "args": { "External id": 14748,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8243 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336757, "tid": 1336757, "ts": 1295650516853.286, "dur": 238.743, "args": { "External id": 14749,"Sequence number": 246615, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8244 } }, { "ph": "s", "id": 153, "pid": 1336757, "tid": 1336757, "ts": 1295650516853.286, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650516883.302, "dur": 174.164, "args": { "External id": 14750,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650516935.396, "dur": 7.671, "args": { "External id": 14751,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650516937.832, "dur": 4.590, "args": { "External id": 14752,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650516945.914, "dur": 5.058, "args": { "External id": 14753,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650516952.442, "dur": 1.720, "args": { "External id": 14754,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650516959.262, "dur": 3.293, "args": { "External id": 14755,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1336757, "ts": 1295650517074.906, "dur": 6.102, "args": { "External id": 14756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517098.329, "dur": 6.897, "args": { "External id": 14757,"Sequence number": 246616, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517100.092, "dur": 5.014, "args": { "External id": 14758,"Sequence number": 246616, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8253 } }, { "ph": "s", "id": 152, "pid": 1336757, "tid": 1336757, "ts": 1295650517100.092, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650517123.805, "dur": 153.601, "args": { "External id": 14759,"Sequence number": 246617, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650517127.519, "dur": 9.346, "args": { "External id": 14760,"Sequence number": 246617, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8255 } }, { "ph": "s", "id": 151, "pid": 1336757, "tid": 1336757, "ts": 1295650517127.519, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650517130.611, "dur": 4.903, "args": { "External id": 14761,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650517133.248, "dur": 1.970, "args": { "External id": 14762,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650517138.685, "dur": 138.403, "args": { "External id": 14763,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517140.594, "dur": 11.457, "args": { "External id": 14764,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517143.757, "dur": 8.018, "args": { "External id": 14765,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8260 } }, { "ph": "s", "id": 150, "pid": 1336757, "tid": 1336757, "ts": 1295650517143.757, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650517153.299, "dur": 111.031, "args": { "External id": 14766,"Sequence number": 246619, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8261 } }, { "ph": "s", "id": 149, "pid": 1336757, "tid": 1336757, "ts": 1295650517153.299, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650517268.830, "dur": 6.984, "args": { "External id": 14767,"Sequence number": 246620, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8262 } }, { "ph": "s", "id": 148, "pid": 1336757, "tid": 1336757, "ts": 1295650517268.830, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650517327.014, "dur": 249.384, "args": { "External id": 14768,"Sequence number": 246621, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8263 } }, { "ph": "s", "id": 147, "pid": 1336757, "tid": 1336757, "ts": 1295650517327.014, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517356.312, "dur": 3.586, "args": { "External id": 14769,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517357.401, "dur": 2.283, "args": { "External id": 14770,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336757, "tid": 1336757, "ts": 1295650517366.547, "dur": 3.930, "args": { "External id": 14771,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517367.858, "dur": 2.507, "args": { "External id": 14772,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517368.944, "dur": 1.320, "args": { "External id": 14773,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650517378.536, "dur": 12.041, "args": { "External id": 14774,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650517383.523, "dur": 6.654, "args": { "External id": 14775,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650517397.181, "dur": 4.307, "args": { "External id": 14776,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650517404.881, "dur": 3.325, "args": { "External id": 14777,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517550.431, "dur": 3.800, "args": { "External id": 14778,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517551.856, "dur": 2.126, "args": { "External id": 14779,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517556.795, "dur": 2.285, "args": { "External id": 14780,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517557.675, "dur": 1.313, "args": { "External id": 14781,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650517599.331, "dur": 108.532, "args": { "External id": 14782,"Sequence number": 246622, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650517600.861, "dur": 8.681, "args": { "External id": 14783,"Sequence number": 246622, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8278 } }, { "ph": "s", "id": 146, "pid": 1336757, "tid": 1336757, "ts": 1295650517600.861, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650517603.699, "dur": 4.473, "args": { "External id": 14784,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650517606.319, "dur": 1.536, "args": { "External id": 14785,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650517610.624, "dur": 96.812, "args": { "External id": 14786,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517614.086, "dur": 4.168, "args": { "External id": 14787,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517615.267, "dur": 2.836, "args": { "External id": 14788,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8283 } }, { "ph": "s", "id": 145, "pid": 1336757, "tid": 1336757, "ts": 1295650517615.267, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650517618.995, "dur": 81.955, "args": { "External id": 14789,"Sequence number": 246624, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8284 } }, { "ph": "s", "id": 144, "pid": 1336757, "tid": 1336757, "ts": 1295650517618.995, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650517703.051, "dur": 3.750, "args": { "External id": 14790,"Sequence number": 246625, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8285 } }, { "ph": "s", "id": 143, "pid": 1336757, "tid": 1336757, "ts": 1295650517703.051, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650517717.316, "dur": 73.530, "args": { "External id": 14791,"Sequence number": 246626, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650517720.237, "dur": 6.548, "args": { "External id": 14792,"Sequence number": 246626, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8287 } }, { "ph": "s", "id": 142, "pid": 1336757, "tid": 1336757, "ts": 1295650517720.237, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650517722.478, "dur": 3.134, "args": { "External id": 14793,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650517724.298, "dur": 1.106, "args": { "External id": 14794,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650517727.538, "dur": 63.077, "args": { "External id": 14795,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517728.823, "dur": 9.354, "args": { "External id": 14796,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517732.277, "dur": 5.753, "args": { "External id": 14797,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8292 } }, { "ph": "s", "id": 141, "pid": 1336757, "tid": 1336757, "ts": 1295650517732.277, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650517739.010, "dur": 44.999, "args": { "External id": 14798,"Sequence number": 246628, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8293 } }, { "ph": "s", "id": 140, "pid": 1336757, "tid": 1336757, "ts": 1295650517739.010, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650517785.613, "dur": 4.594, "args": { "External id": 14799,"Sequence number": 246629, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8294 } }, { "ph": "s", "id": 139, "pid": 1336757, "tid": 1336757, "ts": 1295650517785.613, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650517814.040, "dur": 162.637, "args": { "External id": 14800,"Sequence number": 246630, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8295 } }, { "ph": "s", "id": 138, "pid": 1336757, "tid": 1336757, "ts": 1295650517814.040, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650517860.375, "dur": 4.594, "args": { "External id": 14801,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650517902.827, "dur": 59.671, "args": { "External id": 14802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650517903.350, "dur": 4.852, "args": { "External id": 14803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650517904.503, "dur": 2.975, "args": { "External id": 14804,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650517906.421, "dur": 0.895, "args": { "External id": 14805,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650517909.260, "dur": 52.921, "args": { "External id": 14806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650517912.673, "dur": 2.588, "args": { "External id": 14807,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650517913.968, "dur": 1.136, "args": { "External id": 14808,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650517915.698, "dur": 42.490, "args": { "External id": 14809,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650517960.215, "dur": 1.267, "args": { "External id": 14810,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295650518023.610, "dur": 34.189, "args": { "External id": 14811,"Sequence number": 246631, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8306 } }, { "ph": "s", "id": 137, "pid": 1336757, "tid": 1336757, "ts": 1295650518023.610, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650518098.120, "dur": 232.684, "args": { "External id": 14812,"Sequence number": 246632, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8307 } }, { "ph": "s", "id": 136, "pid": 1336757, "tid": 1336757, "ts": 1295650518098.120, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518120.649, "dur": 6.469, "args": { "External id": 14813,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518124.330, "dur": 2.598, "args": { "External id": 14814,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650518134.929, "dur": 8.341, "args": { "External id": 14815,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650518138.024, "dur": 4.775, "args": { "External id": 14816,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650518148.847, "dur": 4.242, "args": { "External id": 14817,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518306.317, "dur": 5.987, "args": { "External id": 14818,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518308.294, "dur": 3.507, "args": { "External id": 14819,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650518353.901, "dur": 110.239, "args": { "External id": 14820,"Sequence number": 246633, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650518355.251, "dur": 11.786, "args": { "External id": 14821,"Sequence number": 246633, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8316 } }, { "ph": "s", "id": 135, "pid": 1336757, "tid": 1336757, "ts": 1295650518355.251, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650518360.566, "dur": 4.955, "args": { "External id": 14822,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650518363.116, "dur": 2.002, "args": { "External id": 14823,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650518368.310, "dur": 95.533, "args": { "External id": 14824,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518369.837, "dur": 6.291, "args": { "External id": 14825,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518372.856, "dur": 3.135, "args": { "External id": 14826,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8321 } }, { "ph": "s", "id": 134, "pid": 1336757, "tid": 1336757, "ts": 1295650518372.856, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650518377.018, "dur": 80.234, "args": { "External id": 14827,"Sequence number": 246635, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8322 } }, { "ph": "s", "id": 133, "pid": 1336757, "tid": 1336757, "ts": 1295650518377.018, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650518459.389, "dur": 3.456, "args": { "External id": 14828,"Sequence number": 246636, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8323 } }, { "ph": "s", "id": 132, "pid": 1336757, "tid": 1336757, "ts": 1295650518459.389, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650518472.221, "dur": 70.954, "args": { "External id": 14829,"Sequence number": 246637, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650518472.905, "dur": 11.063, "args": { "External id": 14830,"Sequence number": 246637, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8325 } }, { "ph": "s", "id": 131, "pid": 1336757, "tid": 1336757, "ts": 1295650518472.905, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650518479.802, "dur": 2.865, "args": { "External id": 14831,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650518481.524, "dur": 0.984, "args": { "External id": 14832,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650518484.652, "dur": 58.323, "args": { "External id": 14833,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518485.731, "dur": 5.217, "args": { "External id": 14834,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518486.828, "dur": 3.968, "args": { "External id": 14835,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8330 } }, { "ph": "s", "id": 130, "pid": 1336757, "tid": 1336757, "ts": 1295650518486.828, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650518492.060, "dur": 45.935, "args": { "External id": 14836,"Sequence number": 246639, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8331 } }, { "ph": "s", "id": 129, "pid": 1336757, "tid": 1336757, "ts": 1295650518492.060, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650518539.768, "dur": 2.763, "args": { "External id": 14837,"Sequence number": 246640, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8332 } }, { "ph": "s", "id": 128, "pid": 1336757, "tid": 1336757, "ts": 1295650518539.768, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650518551.061, "dur": 65.066, "args": { "External id": 14838,"Sequence number": 246641, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650518551.662, "dur": 9.778, "args": { "External id": 14839,"Sequence number": 246641, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8334 } }, { "ph": "s", "id": 127, "pid": 1336757, "tid": 1336757, "ts": 1295650518551.662, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650518553.442, "dur": 6.563, "args": { "External id": 14840,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650518556.995, "dur": 2.597, "args": { "External id": 14841,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650518561.978, "dur": 53.912, "args": { "External id": 14842,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518563.361, "dur": 4.482, "args": { "External id": 14843,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518564.166, "dur": 3.345, "args": { "External id": 14844,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8339 } }, { "ph": "s", "id": 126, "pid": 1336757, "tid": 1336757, "ts": 1295650518564.166, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650518571.167, "dur": 38.334, "args": { "External id": 14845,"Sequence number": 246643, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8340 } }, { "ph": "s", "id": 125, "pid": 1336757, "tid": 1336757, "ts": 1295650518571.167, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650518611.229, "dur": 4.323, "args": { "External id": 14846,"Sequence number": 246644, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8341 } }, { "ph": "s", "id": 124, "pid": 1336757, "tid": 1336757, "ts": 1295650518611.229, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518631.830, "dur": 4.512, "args": { "External id": 14847,"Sequence number": 246645, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518633.053, "dur": 3.137, "args": { "External id": 14848,"Sequence number": 246645, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8343 } }, { "ph": "s", "id": 123, "pid": 1336757, "tid": 1336757, "ts": 1295650518633.053, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518672.814, "dur": 8.464, "args": { "External id": 14849,"Sequence number": 246646, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518676.085, "dur": 5.058, "args": { "External id": 14850,"Sequence number": 246646, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8345 } }, { "ph": "s", "id": 122, "pid": 1336757, "tid": 1336757, "ts": 1295650518676.085, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650518685.725, "dur": 4.833, "args": { "External id": 14851,"Sequence number": 246647, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650518686.683, "dur": 3.715, "args": { "External id": 14852,"Sequence number": 246647, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8347 } }, { "ph": "s", "id": 121, "pid": 1336757, "tid": 1336757, "ts": 1295650518686.683, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650518722.855, "dur": 169.191, "args": { "External id": 14853,"Sequence number": 246648, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8348 } }, { "ph": "s", "id": 120, "pid": 1336757, "tid": 1336757, "ts": 1295650518722.855, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650518744.962, "dur": 9.769, "args": { "External id": 14854,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650518748.200, "dur": 6.085, "args": { "External id": 14855,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8350 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650518907.032, "dur": 152.866, "args": { "External id": 14856,"Sequence number": 246649, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8351 } }, { "ph": "s", "id": 119, "pid": 1336757, "tid": 1336757, "ts": 1295650518907.032, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650518921.878, "dur": 7.580, "args": { "External id": 14857,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650518924.429, "dur": 4.590, "args": { "External id": 14858,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8353 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336757, "tid": 1336757, "ts": 1295650519090.811, "dur": 224.303, "args": { "External id": 14859,"Sequence number": 246650, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8354 } }, { "ph": "s", "id": 118, "pid": 1336757, "tid": 1336757, "ts": 1295650519090.811, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650519121.635, "dur": 156.819, "args": { "External id": 14860,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650519170.513, "dur": 9.623, "args": { "External id": 14861,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650519173.315, "dur": 6.213, "args": { "External id": 14862,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650519182.962, "dur": 4.457, "args": { "External id": 14863,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650519188.481, "dur": 3.254, "args": { "External id": 14864,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650519194.319, "dur": 3.755, "args": { "External id": 14865,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1336757, "ts": 1295650519294.067, "dur": 6.342, "args": { "External id": 14866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519322.475, "dur": 9.489, "args": { "External id": 14867,"Sequence number": 246651, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519324.256, "dur": 7.509, "args": { "External id": 14868,"Sequence number": 246651, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8363 } }, { "ph": "s", "id": 117, "pid": 1336757, "tid": 1336757, "ts": 1295650519324.256, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650519350.501, "dur": 120.436, "args": { "External id": 14869,"Sequence number": 246652, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650519351.981, "dur": 8.424, "args": { "External id": 14870,"Sequence number": 246652, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8365 } }, { "ph": "s", "id": 116, "pid": 1336757, "tid": 1336757, "ts": 1295650519351.981, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650519354.394, "dur": 4.917, "args": { "External id": 14871,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650519357.120, "dur": 1.879, "args": { "External id": 14872,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650519361.772, "dur": 108.875, "args": { "External id": 14873,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519365.838, "dur": 5.517, "args": { "External id": 14874,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519366.851, "dur": 4.367, "args": { "External id": 14875,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8370 } }, { "ph": "s", "id": 115, "pid": 1336757, "tid": 1336757, "ts": 1295650519366.851, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650519372.393, "dur": 88.840, "args": { "External id": 14876,"Sequence number": 246654, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8371 } }, { "ph": "s", "id": 114, "pid": 1336757, "tid": 1336757, "ts": 1295650519372.393, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650519463.563, "dur": 6.194, "args": { "External id": 14877,"Sequence number": 246655, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8372 } }, { "ph": "s", "id": 113, "pid": 1336757, "tid": 1336757, "ts": 1295650519463.563, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650519508.641, "dur": 221.854, "args": { "External id": 14878,"Sequence number": 246656, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8373 } }, { "ph": "s", "id": 112, "pid": 1336757, "tid": 1336757, "ts": 1295650519508.641, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519533.038, "dur": 2.939, "args": { "External id": 14879,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519533.886, "dur": 1.907, "args": { "External id": 14880,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336757, "tid": 1336757, "ts": 1295650519539.808, "dur": 4.705, "args": { "External id": 14881,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519540.745, "dur": 3.659, "args": { "External id": 14882,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519543.217, "dur": 1.024, "args": { "External id": 14883,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650519552.968, "dur": 7.753, "args": { "External id": 14884,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650519555.321, "dur": 5.042, "args": { "External id": 14885,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650519567.240, "dur": 3.804, "args": { "External id": 14886,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650519574.249, "dur": 3.465, "args": { "External id": 14887,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519706.446, "dur": 3.374, "args": { "External id": 14888,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519707.562, "dur": 2.076, "args": { "External id": 14889,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519714.567, "dur": 2.424, "args": { "External id": 14890,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519715.635, "dur": 1.256, "args": { "External id": 14891,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650519750.137, "dur": 91.028, "args": { "External id": 14892,"Sequence number": 246657, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650519751.074, "dur": 6.971, "args": { "External id": 14893,"Sequence number": 246657, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8388 } }, { "ph": "s", "id": 111, "pid": 1336757, "tid": 1336757, "ts": 1295650519751.074, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650519752.975, "dur": 3.735, "args": { "External id": 14894,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650519754.871, "dur": 1.401, "args": { "External id": 14895,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650519760.777, "dur": 80.111, "args": { "External id": 14896,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519762.037, "dur": 3.599, "args": { "External id": 14897,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519763.052, "dur": 2.454, "args": { "External id": 14898,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8393 } }, { "ph": "s", "id": 110, "pid": 1336757, "tid": 1336757, "ts": 1295650519763.052, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650519766.318, "dur": 67.358, "args": { "External id": 14899,"Sequence number": 246659, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8394 } }, { "ph": "s", "id": 109, "pid": 1336757, "tid": 1336757, "ts": 1295650519766.318, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650519835.825, "dur": 4.526, "args": { "External id": 14900,"Sequence number": 246660, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8395 } }, { "ph": "s", "id": 108, "pid": 1336757, "tid": 1336757, "ts": 1295650519835.825, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650519849.410, "dur": 69.432, "args": { "External id": 14901,"Sequence number": 246661, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650519850.171, "dur": 4.914, "args": { "External id": 14902,"Sequence number": 246661, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8397 } }, { "ph": "s", "id": 107, "pid": 1336757, "tid": 1336757, "ts": 1295650519850.171, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650519851.473, "dur": 2.460, "args": { "External id": 14903,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650519852.707, "dur": 1.049, "args": { "External id": 14904,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650519855.623, "dur": 62.982, "args": { "External id": 14905,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650519859.031, "dur": 6.489, "args": { "External id": 14906,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650519859.919, "dur": 5.428, "args": { "External id": 14907,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8402 } }, { "ph": "s", "id": 106, "pid": 1336757, "tid": 1336757, "ts": 1295650519859.919, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650519866.105, "dur": 45.423, "args": { "External id": 14908,"Sequence number": 246663, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8403 } }, { "ph": "s", "id": 105, "pid": 1336757, "tid": 1336757, "ts": 1295650519866.105, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650519913.561, "dur": 4.657, "args": { "External id": 14909,"Sequence number": 246664, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8404 } }, { "ph": "s", "id": 104, "pid": 1336757, "tid": 1336757, "ts": 1295650519913.561, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650519940.660, "dur": 207.664, "args": { "External id": 14910,"Sequence number": 246665, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8405 } }, { "ph": "s", "id": 103, "pid": 1336757, "tid": 1336757, "ts": 1295650519940.660, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650519979.077, "dur": 4.275, "args": { "External id": 14911,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650520067.008, "dur": 66.349, "args": { "External id": 14912,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650520067.923, "dur": 6.462, "args": { "External id": 14913,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650520069.532, "dur": 3.702, "args": { "External id": 14914,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650520071.584, "dur": 1.301, "args": { "External id": 14915,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650520077.798, "dur": 55.193, "args": { "External id": 14916,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520078.798, "dur": 2.392, "args": { "External id": 14917,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520079.572, "dur": 1.465, "args": { "External id": 14918,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650520081.772, "dur": 46.921, "args": { "External id": 14919,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650520130.836, "dur": 1.244, "args": { "External id": 14920,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295650520157.623, "dur": 27.557, "args": { "External id": 14921,"Sequence number": 246666, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8416 } }, { "ph": "s", "id": 102, "pid": 1336757, "tid": 1336757, "ts": 1295650520157.623, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650520221.937, "dur": 227.491, "args": { "External id": 14922,"Sequence number": 246667, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8417 } }, { "ph": "s", "id": 101, "pid": 1336757, "tid": 1336757, "ts": 1295650520221.937, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520267.467, "dur": 5.048, "args": { "External id": 14923,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520268.911, "dur": 3.228, "args": { "External id": 14924,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650520282.411, "dur": 9.769, "args": { "External id": 14925,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650520285.688, "dur": 5.943, "args": { "External id": 14926,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650520299.528, "dur": 5.214, "args": { "External id": 14927,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520429.449, "dur": 3.405, "args": { "External id": 14928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520430.579, "dur": 2.122, "args": { "External id": 14929,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650520469.516, "dur": 95.110, "args": { "External id": 14930,"Sequence number": 246668, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650520470.681, "dur": 8.035, "args": { "External id": 14931,"Sequence number": 246668, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8426 } }, { "ph": "s", "id": 100, "pid": 1336757, "tid": 1336757, "ts": 1295650520470.681, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650520473.503, "dur": 3.878, "args": { "External id": 14932,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650520475.506, "dur": 1.490, "args": { "External id": 14933,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650520479.874, "dur": 84.441, "args": { "External id": 14934,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520483.527, "dur": 3.928, "args": { "External id": 14935,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520484.512, "dur": 2.706, "args": { "External id": 14936,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8431 } }, { "ph": "s", "id": 99, "pid": 1336757, "tid": 1336757, "ts": 1295650520484.512, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650520488.122, "dur": 68.060, "args": { "External id": 14937,"Sequence number": 246670, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8432 } }, { "ph": "s", "id": 98, "pid": 1336757, "tid": 1336757, "ts": 1295650520488.122, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650520558.193, "dur": 5.338, "args": { "External id": 14938,"Sequence number": 246671, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8433 } }, { "ph": "s", "id": 97, "pid": 1336757, "tid": 1336757, "ts": 1295650520558.193, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650520572.597, "dur": 62.104, "args": { "External id": 14939,"Sequence number": 246672, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650520575.136, "dur": 6.084, "args": { "External id": 14940,"Sequence number": 246672, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8435 } }, { "ph": "s", "id": 96, "pid": 1336757, "tid": 1336757, "ts": 1295650520575.136, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650520577.170, "dur": 2.747, "args": { "External id": 14941,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650520578.668, "dur": 1.063, "args": { "External id": 14942,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650520581.987, "dur": 52.531, "args": { "External id": 14943,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520582.664, "dur": 5.424, "args": { "External id": 14944,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520585.747, "dur": 2.220, "args": { "External id": 14945,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8440 } }, { "ph": "s", "id": 95, "pid": 1336757, "tid": 1336757, "ts": 1295650520585.747, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650520588.520, "dur": 41.597, "args": { "External id": 14946,"Sequence number": 246674, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8441 } }, { "ph": "s", "id": 94, "pid": 1336757, "tid": 1336757, "ts": 1295650520588.520, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650520631.611, "dur": 2.583, "args": { "External id": 14947,"Sequence number": 246675, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8442 } }, { "ph": "s", "id": 93, "pid": 1336757, "tid": 1336757, "ts": 1295650520631.611, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650520641.335, "dur": 65.497, "args": { "External id": 14948,"Sequence number": 246676, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650520642.140, "dur": 8.827, "args": { "External id": 14949,"Sequence number": 246676, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8444 } }, { "ph": "s", "id": 92, "pid": 1336757, "tid": 1336757, "ts": 1295650520642.140, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650520645.248, "dur": 4.353, "args": { "External id": 14950,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650520646.379, "dur": 3.001, "args": { "External id": 14951,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650520651.528, "dur": 55.091, "args": { "External id": 14952,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520652.706, "dur": 6.285, "args": { "External id": 14953,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520655.734, "dur": 3.123, "args": { "External id": 14954,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8449 } }, { "ph": "s", "id": 91, "pid": 1336757, "tid": 1336757, "ts": 1295650520655.734, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650520659.448, "dur": 41.173, "args": { "External id": 14955,"Sequence number": 246678, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8450 } }, { "ph": "s", "id": 90, "pid": 1336757, "tid": 1336757, "ts": 1295650520659.448, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650520702.148, "dur": 4.089, "args": { "External id": 14956,"Sequence number": 246679, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8451 } }, { "ph": "s", "id": 89, "pid": 1336757, "tid": 1336757, "ts": 1295650520702.148, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520721.571, "dur": 5.175, "args": { "External id": 14957,"Sequence number": 246680, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520722.188, "dur": 4.417, "args": { "External id": 14958,"Sequence number": 246680, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8453 } }, { "ph": "s", "id": 88, "pid": 1336757, "tid": 1336757, "ts": 1295650520722.188, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520733.755, "dur": 3.671, "args": { "External id": 14959,"Sequence number": 246681, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520735.111, "dur": 2.181, "args": { "External id": 14960,"Sequence number": 246681, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8455 } }, { "ph": "s", "id": 87, "pid": 1336757, "tid": 1336757, "ts": 1295650520735.111, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650520741.560, "dur": 3.120, "args": { "External id": 14961,"Sequence number": 246682, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650520742.407, "dur": 2.147, "args": { "External id": 14962,"Sequence number": 246682, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8457 } }, { "ph": "s", "id": 86, "pid": 1336757, "tid": 1336757, "ts": 1295650520742.407, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650520773.658, "dur": 152.759, "args": { "External id": 14963,"Sequence number": 246683, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8458 } }, { "ph": "s", "id": 85, "pid": 1336757, "tid": 1336757, "ts": 1295650520773.658, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650520795.574, "dur": 10.033, "args": { "External id": 14964,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650520797.763, "dur": 7.408, "args": { "External id": 14965,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8460 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650520939.206, "dur": 159.020, "args": { "External id": 14966,"Sequence number": 246684, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8461 } }, { "ph": "s", "id": 84, "pid": 1336757, "tid": 1336757, "ts": 1295650520939.206, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650520953.839, "dur": 7.969, "args": { "External id": 14967,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650520956.129, "dur": 5.317, "args": { "External id": 14968,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8463 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336757, "tid": 1336757, "ts": 1295650521130.825, "dur": 228.295, "args": { "External id": 14969,"Sequence number": 246685, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8464 } }, { "ph": "s", "id": 83, "pid": 1336757, "tid": 1336757, "ts": 1295650521130.825, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650521156.911, "dur": 167.291, "args": { "External id": 14970,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650521205.893, "dur": 9.240, "args": { "External id": 14971,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650521208.622, "dur": 5.678, "args": { "External id": 14972,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650521217.833, "dur": 4.576, "args": { "External id": 14973,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650521223.594, "dur": 1.612, "args": { "External id": 14974,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650521244.892, "dur": 6.145, "args": { "External id": 14975,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1336757, "ts": 1295650521339.216, "dur": 6.389, "args": { "External id": 14976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521365.474, "dur": 7.980, "args": { "External id": 14977,"Sequence number": 246686, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521367.892, "dur": 5.386, "args": { "External id": 14978,"Sequence number": 246686, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8473 } }, { "ph": "s", "id": 82, "pid": 1336757, "tid": 1336757, "ts": 1295650521367.892, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650521388.574, "dur": 144.097, "args": { "External id": 14979,"Sequence number": 246687, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650521390.019, "dur": 13.069, "args": { "External id": 14980,"Sequence number": 246687, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8475 } }, { "ph": "s", "id": 81, "pid": 1336757, "tid": 1336757, "ts": 1295650521390.019, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650521395.120, "dur": 6.866, "args": { "External id": 14981,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650521400.091, "dur": 1.606, "args": { "External id": 14982,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650521404.626, "dur": 127.721, "args": { "External id": 14983,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521406.516, "dur": 3.587, "args": { "External id": 14984,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521407.340, "dur": 2.657, "args": { "External id": 14985,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8480 } }, { "ph": "s", "id": 80, "pid": 1336757, "tid": 1336757, "ts": 1295650521407.340, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650521411.003, "dur": 111.355, "args": { "External id": 14986,"Sequence number": 246689, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8481 } }, { "ph": "s", "id": 79, "pid": 1336757, "tid": 1336757, "ts": 1295650521411.003, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650521524.959, "dur": 6.496, "args": { "External id": 14987,"Sequence number": 246690, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8482 } }, { "ph": "s", "id": 78, "pid": 1336757, "tid": 1336757, "ts": 1295650521524.959, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650521571.308, "dur": 221.526, "args": { "External id": 14988,"Sequence number": 246691, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8483 } }, { "ph": "s", "id": 77, "pid": 1336757, "tid": 1336757, "ts": 1295650521571.308, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521591.224, "dur": 3.072, "args": { "External id": 14989,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521592.267, "dur": 1.892, "args": { "External id": 14990,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336757, "tid": 1336757, "ts": 1295650521598.017, "dur": 6.337, "args": { "External id": 14991,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521602.279, "dur": 1.971, "args": { "External id": 14992,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521602.865, "dur": 1.220, "args": { "External id": 14993,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650521612.689, "dur": 8.365, "args": { "External id": 14994,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650521614.625, "dur": 6.106, "args": { "External id": 14995,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650521627.162, "dur": 3.594, "args": { "External id": 14996,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650521634.232, "dur": 3.969, "args": { "External id": 14997,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521771.044, "dur": 3.225, "args": { "External id": 14998,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521772.051, "dur": 1.992, "args": { "External id": 14999,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521776.896, "dur": 2.295, "args": { "External id": 15000,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521777.794, "dur": 1.297, "args": { "External id": 15001,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650521810.831, "dur": 109.761, "args": { "External id": 15002,"Sequence number": 246692, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650521821.295, "dur": 9.734, "args": { "External id": 15003,"Sequence number": 246692, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8498 } }, { "ph": "s", "id": 76, "pid": 1336757, "tid": 1336757, "ts": 1295650521821.295, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650521826.030, "dur": 3.795, "args": { "External id": 15004,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650521828.057, "dur": 1.475, "args": { "External id": 15005,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650521831.889, "dur": 88.427, "args": { "External id": 15006,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521833.356, "dur": 7.229, "args": { "External id": 15007,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521834.214, "dur": 6.158, "args": { "External id": 15008,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8503 } }, { "ph": "s", "id": 75, "pid": 1336757, "tid": 1336757, "ts": 1295650521834.214, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650521841.303, "dur": 68.923, "args": { "External id": 15009,"Sequence number": 246694, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8504 } }, { "ph": "s", "id": 74, "pid": 1336757, "tid": 1336757, "ts": 1295650521841.303, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650521912.076, "dur": 7.651, "args": { "External id": 15010,"Sequence number": 246695, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8505 } }, { "ph": "s", "id": 73, "pid": 1336757, "tid": 1336757, "ts": 1295650521912.076, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650521929.327, "dur": 116.452, "args": { "External id": 15011,"Sequence number": 246696, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650521930.068, "dur": 8.357, "args": { "External id": 15012,"Sequence number": 246696, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8507 } }, { "ph": "s", "id": 72, "pid": 1336757, "tid": 1336757, "ts": 1295650521930.068, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650521931.907, "dur": 5.207, "args": { "External id": 15013,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650521935.780, "dur": 1.138, "args": { "External id": 15014,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650521938.913, "dur": 106.634, "args": { "External id": 15015,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650521940.199, "dur": 4.498, "args": { "External id": 15016,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650521940.775, "dur": 3.779, "args": { "External id": 15017,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8512 } }, { "ph": "s", "id": 71, "pid": 1336757, "tid": 1336757, "ts": 1295650521940.775, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650521947.475, "dur": 90.097, "args": { "External id": 15018,"Sequence number": 246698, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8513 } }, { "ph": "s", "id": 70, "pid": 1336757, "tid": 1336757, "ts": 1295650521947.475, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650522040.867, "dur": 4.045, "args": { "External id": 15019,"Sequence number": 246699, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8514 } }, { "ph": "s", "id": 69, "pid": 1336757, "tid": 1336757, "ts": 1295650522040.867, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650522070.142, "dur": 175.862, "args": { "External id": 15020,"Sequence number": 246700, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8515 } }, { "ph": "s", "id": 68, "pid": 1336757, "tid": 1336757, "ts": 1295650522070.142, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650522109.223, "dur": 5.387, "args": { "External id": 15021,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650522149.383, "dur": 63.661, "args": { "External id": 15022,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650522150.222, "dur": 5.939, "args": { "External id": 15023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650522151.346, "dur": 3.820, "args": { "External id": 15024,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650522153.924, "dur": 1.030, "args": { "External id": 15025,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650522157.098, "dur": 55.636, "args": { "External id": 15026,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522158.341, "dur": 2.239, "args": { "External id": 15027,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522159.134, "dur": 1.290, "args": { "External id": 15028,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650522163.307, "dur": 45.596, "args": { "External id": 15029,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650522210.818, "dur": 1.323, "args": { "External id": 15030,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295650522259.675, "dur": 37.670, "args": { "External id": 15031,"Sequence number": 246701, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8526 } }, { "ph": "s", "id": 67, "pid": 1336757, "tid": 1336757, "ts": 1295650522259.675, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650522342.867, "dur": 199.809, "args": { "External id": 15032,"Sequence number": 246702, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8527 } }, { "ph": "s", "id": 66, "pid": 1336757, "tid": 1336757, "ts": 1295650522342.867, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522365.023, "dur": 4.524, "args": { "External id": 15033,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522366.518, "dur": 2.753, "args": { "External id": 15034,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650522381.440, "dur": 10.012, "args": { "External id": 15035,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650522386.191, "dur": 4.781, "args": { "External id": 15036,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650522402.327, "dur": 5.870, "args": { "External id": 15037,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522529.380, "dur": 3.131, "args": { "External id": 15038,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522530.312, "dur": 2.038, "args": { "External id": 15039,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650522562.318, "dur": 98.825, "args": { "External id": 15040,"Sequence number": 246703, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650522563.477, "dur": 10.403, "args": { "External id": 15041,"Sequence number": 246703, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8536 } }, { "ph": "s", "id": 65, "pid": 1336757, "tid": 1336757, "ts": 1295650522563.477, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650522566.091, "dur": 6.479, "args": { "External id": 15042,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650522570.685, "dur": 1.626, "args": { "External id": 15043,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650522574.898, "dur": 85.958, "args": { "External id": 15044,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522576.374, "dur": 3.964, "args": { "External id": 15045,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522577.151, "dur": 3.009, "args": { "External id": 15046,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8541 } }, { "ph": "s", "id": 64, "pid": 1336757, "tid": 1336757, "ts": 1295650522577.151, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650522583.308, "dur": 71.154, "args": { "External id": 15047,"Sequence number": 246705, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8542 } }, { "ph": "s", "id": 63, "pid": 1336757, "tid": 1336757, "ts": 1295650522583.308, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650522656.603, "dur": 3.399, "args": { "External id": 15048,"Sequence number": 246706, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8543 } }, { "ph": "s", "id": 62, "pid": 1336757, "tid": 1336757, "ts": 1295650522656.603, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650522669.486, "dur": 67.864, "args": { "External id": 15049,"Sequence number": 246707, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650522670.186, "dur": 9.529, "args": { "External id": 15050,"Sequence number": 246707, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8545 } }, { "ph": "s", "id": 61, "pid": 1336757, "tid": 1336757, "ts": 1295650522670.186, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650522671.535, "dur": 6.711, "args": { "External id": 15051,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650522674.951, "dur": 3.079, "args": { "External id": 15052,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650522680.519, "dur": 56.556, "args": { "External id": 15053,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522681.403, "dur": 3.381, "args": { "External id": 15054,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522682.226, "dur": 2.427, "args": { "External id": 15055,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8550 } }, { "ph": "s", "id": 60, "pid": 1336757, "tid": 1336757, "ts": 1295650522682.226, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650522685.273, "dur": 42.818, "args": { "External id": 15056,"Sequence number": 246709, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8551 } }, { "ph": "s", "id": 59, "pid": 1336757, "tid": 1336757, "ts": 1295650522685.273, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650522729.821, "dur": 6.833, "args": { "External id": 15057,"Sequence number": 246710, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8552 } }, { "ph": "s", "id": 58, "pid": 1336757, "tid": 1336757, "ts": 1295650522729.821, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650522743.678, "dur": 60.272, "args": { "External id": 15058,"Sequence number": 246711, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650522744.324, "dur": 5.324, "args": { "External id": 15059,"Sequence number": 246711, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8554 } }, { "ph": "s", "id": 57, "pid": 1336757, "tid": 1336757, "ts": 1295650522744.324, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650522745.961, "dur": 2.647, "args": { "External id": 15060,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650522747.488, "dur": 0.945, "args": { "External id": 15061,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650522752.068, "dur": 51.661, "args": { "External id": 15062,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522753.020, "dur": 4.117, "args": { "External id": 15063,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522753.620, "dur": 3.402, "args": { "External id": 15064,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8559 } }, { "ph": "s", "id": 56, "pid": 1336757, "tid": 1336757, "ts": 1295650522753.620, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650522757.595, "dur": 40.400, "args": { "External id": 15065,"Sequence number": 246713, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8560 } }, { "ph": "s", "id": 55, "pid": 1336757, "tid": 1336757, "ts": 1295650522757.595, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650522799.675, "dur": 3.736, "args": { "External id": 15066,"Sequence number": 246714, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8561 } }, { "ph": "s", "id": 54, "pid": 1336757, "tid": 1336757, "ts": 1295650522799.675, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522818.954, "dur": 3.731, "args": { "External id": 15067,"Sequence number": 246715, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522819.717, "dur": 2.844, "args": { "External id": 15068,"Sequence number": 246715, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8563 } }, { "ph": "s", "id": 53, "pid": 1336757, "tid": 1336757, "ts": 1295650522819.717, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522829.165, "dur": 3.451, "args": { "External id": 15069,"Sequence number": 246716, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522830.524, "dur": 1.952, "args": { "External id": 15070,"Sequence number": 246716, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8565 } }, { "ph": "s", "id": 52, "pid": 1336757, "tid": 1336757, "ts": 1295650522830.524, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650522838.487, "dur": 4.980, "args": { "External id": 15071,"Sequence number": 246717, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650522839.275, "dur": 4.033, "args": { "External id": 15072,"Sequence number": 246717, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8567 } }, { "ph": "s", "id": 51, "pid": 1336757, "tid": 1336757, "ts": 1295650522839.275, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650522870.848, "dur": 178.935, "args": { "External id": 15073,"Sequence number": 246718, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8568 } }, { "ph": "s", "id": 50, "pid": 1336757, "tid": 1336757, "ts": 1295650522870.848, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650522889.116, "dur": 7.227, "args": { "External id": 15074,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650522891.354, "dur": 4.541, "args": { "External id": 15075,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8570 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650523064.276, "dur": 115.373, "args": { "External id": 15076,"Sequence number": 246719, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8571 } }, { "ph": "s", "id": 49, "pid": 1336757, "tid": 1336757, "ts": 1295650523064.276, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650523078.945, "dur": 8.830, "args": { "External id": 15077,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650523081.546, "dur": 5.778, "args": { "External id": 15078,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8573 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336757, "tid": 1336757, "ts": 1295650523206.850, "dur": 229.429, "args": { "External id": 15079,"Sequence number": 246720, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8574 } }, { "ph": "s", "id": 48, "pid": 1336757, "tid": 1336757, "ts": 1295650523206.850, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650523254.760, "dur": 151.608, "args": { "External id": 15080,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650523318.248, "dur": 12.195, "args": { "External id": 15081,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650523322.667, "dur": 7.128, "args": { "External id": 15082,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650523333.248, "dur": 5.178, "args": { "External id": 15083,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650523339.669, "dur": 3.462, "args": { "External id": 15084,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650523345.818, "dur": 3.170, "args": { "External id": 15085,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336757, "tid": 1336757, "ts": 1295650523418.022, "dur": 6.059, "args": { "External id": 15086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523441.557, "dur": 6.314, "args": { "External id": 15087,"Sequence number": 246721, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523443.061, "dur": 4.633, "args": { "External id": 15088,"Sequence number": 246721, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8583 } }, { "ph": "s", "id": 47, "pid": 1336757, "tid": 1336757, "ts": 1295650523443.061, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650523463.013, "dur": 118.887, "args": { "External id": 15089,"Sequence number": 246722, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650523466.567, "dur": 9.195, "args": { "External id": 15090,"Sequence number": 246722, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8585 } }, { "ph": "s", "id": 46, "pid": 1336757, "tid": 1336757, "ts": 1295650523466.567, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650523469.270, "dur": 5.274, "args": { "External id": 15091,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650523472.378, "dur": 1.789, "args": { "External id": 15092,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650523476.930, "dur": 104.576, "args": { "External id": 15093,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523478.879, "dur": 6.908, "args": { "External id": 15094,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523483.123, "dur": 2.480, "args": { "External id": 15095,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8590 } }, { "ph": "s", "id": 45, "pid": 1336757, "tid": 1336757, "ts": 1295650523483.123, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650523486.864, "dur": 86.681, "args": { "External id": 15096,"Sequence number": 246724, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8591 } }, { "ph": "s", "id": 44, "pid": 1336757, "tid": 1336757, "ts": 1295650523486.864, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650523576.346, "dur": 4.267, "args": { "External id": 15097,"Sequence number": 246725, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8592 } }, { "ph": "s", "id": 43, "pid": 1336757, "tid": 1336757, "ts": 1295650523576.346, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650523617.131, "dur": 216.511, "args": { "External id": 15098,"Sequence number": 246726, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8593 } }, { "ph": "s", "id": 42, "pid": 1336757, "tid": 1336757, "ts": 1295650523617.131, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523638.139, "dur": 3.409, "args": { "External id": 15099,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523639.303, "dur": 2.032, "args": { "External id": 15100,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336757, "tid": 1336757, "ts": 1295650523645.565, "dur": 3.499, "args": { "External id": 15101,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523646.649, "dur": 2.305, "args": { "External id": 15102,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523647.404, "dur": 1.386, "args": { "External id": 15103,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650523656.399, "dur": 9.551, "args": { "External id": 15104,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650523660.635, "dur": 4.904, "args": { "External id": 15105,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650523672.081, "dur": 3.384, "args": { "External id": 15106,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650523678.843, "dur": 4.649, "args": { "External id": 15107,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523812.127, "dur": 3.266, "args": { "External id": 15108,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523813.416, "dur": 1.682, "args": { "External id": 15109,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523817.841, "dur": 2.350, "args": { "External id": 15110,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523819.023, "dur": 1.064, "args": { "External id": 15111,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650523852.861, "dur": 95.180, "args": { "External id": 15112,"Sequence number": 246727, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650523853.796, "dur": 8.879, "args": { "External id": 15113,"Sequence number": 246727, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8608 } }, { "ph": "s", "id": 41, "pid": 1336757, "tid": 1336757, "ts": 1295650523853.796, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650523855.867, "dur": 5.410, "args": { "External id": 15114,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650523857.808, "dur": 3.124, "args": { "External id": 15115,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650523863.805, "dur": 83.908, "args": { "External id": 15116,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523865.778, "dur": 5.432, "args": { "External id": 15117,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523868.676, "dur": 2.204, "args": { "External id": 15118,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8613 } }, { "ph": "s", "id": 40, "pid": 1336757, "tid": 1336757, "ts": 1295650523868.676, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650523872.057, "dur": 67.380, "args": { "External id": 15119,"Sequence number": 246729, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8614 } }, { "ph": "s", "id": 39, "pid": 1336757, "tid": 1336757, "ts": 1295650523872.057, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650523941.614, "dur": 5.474, "args": { "External id": 15120,"Sequence number": 246730, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8615 } }, { "ph": "s", "id": 38, "pid": 1336757, "tid": 1336757, "ts": 1295650523941.614, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650523956.646, "dur": 125.935, "args": { "External id": 15121,"Sequence number": 246731, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650523957.345, "dur": 10.369, "args": { "External id": 15122,"Sequence number": 246731, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8617 } }, { "ph": "s", "id": 37, "pid": 1336757, "tid": 1336757, "ts": 1295650523957.345, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650523963.047, "dur": 2.885, "args": { "External id": 15123,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650523964.618, "dur": 0.926, "args": { "External id": 15124,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650523968.568, "dur": 113.749, "args": { "External id": 15125,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650523969.369, "dur": 6.675, "args": { "External id": 15126,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650523972.459, "dur": 3.472, "args": { "External id": 15127,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8622 } }, { "ph": "s", "id": 36, "pid": 1336757, "tid": 1336757, "ts": 1295650523972.459, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650523976.532, "dur": 95.880, "args": { "External id": 15128,"Sequence number": 246733, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8623 } }, { "ph": "s", "id": 35, "pid": 1336757, "tid": 1336757, "ts": 1295650523976.532, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650524075.683, "dur": 6.069, "args": { "External id": 15129,"Sequence number": 246734, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8624 } }, { "ph": "s", "id": 34, "pid": 1336757, "tid": 1336757, "ts": 1295650524075.683, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650524106.036, "dur": 188.825, "args": { "External id": 15130,"Sequence number": 246735, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8625 } }, { "ph": "s", "id": 33, "pid": 1336757, "tid": 1336757, "ts": 1295650524106.036, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650524147.603, "dur": 5.353, "args": { "External id": 15131,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650524185.299, "dur": 91.635, "args": { "External id": 15132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650524186.326, "dur": 7.720, "args": { "External id": 15133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650524187.911, "dur": 5.088, "args": { "External id": 15134,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524189.803, "dur": 2.988, "args": { "External id": 15135,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650524195.085, "dur": 81.352, "args": { "External id": 15136,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336757, "tid": 1336757, "ts": 1295650524197.234, "dur": 4.500, "args": { "External id": 15137,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650524200.343, "dur": 1.242, "args": { "External id": 15138,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650524202.585, "dur": 66.497, "args": { "External id": 15139,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336757, "tid": 1336757, "ts": 1295650524273.372, "dur": 1.909, "args": { "External id": 15140,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295650524306.813, "dur": 31.604, "args": { "External id": 15141,"Sequence number": 246736, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8636 } }, { "ph": "s", "id": 32, "pid": 1336757, "tid": 1336757, "ts": 1295650524306.813, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336757, "tid": 1336757, "ts": 1295650524359.237, "dur": 46.057, "args": { "External id": 15142,"Sequence number": 246737, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "-2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1]], []], "Input Dims": [[[16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048]], []], "Ev Idx": 8637 } }, { "ph": "s", "id": 31, "pid": 1336757, "tid": 1336757, "ts": 1295650524359.237, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 1336757, "tid": 1336757, "ts": 1295650524370.021, "dur": 30.486, "args": { "External id": 15143,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1]], []], "Input Dims": [[[16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048]], []], "Ev Idx": 8638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650524402.091, "dur": 1.406, "args": { "External id": 15144,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 8192], []], "Ev Idx": 8639 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336757, "tid": 1336757, "ts": 1295650524444.756, "dur": 50.822, "args": { "External id": 15145,"Record function id": 0, "Ev Idx": 8640 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 2/0", "pid": 1336757, "tid": 1336757, "ts": 1295650524496.841, "dur": 196.004, "args": { "External id": 15146,"Record function id": 0, "Ev Idx": 8641 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650524537.339, "dur": 146.861, "args": { "External id": 15147,"Sequence number": 246738, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1], [33554432, 8192, 2048, 1]], "Input Dims": [[2048], [16, 4096, 4, 2048]], "Ev Idx": 8642 } }, { "ph": "s", "id": 30, "pid": 1336757, "tid": 1336757, "ts": 1295650524537.339, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336757, "tid": 1336757, "ts": 1295650524610.169, "dur": 36.147, "args": { "External id": 15148,"kernel_hash": "cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/fm/cfm353rsfwkbkca5jmv2fnid3xh6d36yeu3b4ybp4yeabcp47toh.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 2048], [262144, 2048], [2048], [262144], [], [], [], [], [], [], [], [], []], "Ev Idx": 8643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295650524782.408, "dur": 38.558, "args": { "External id": 15149,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650524785.275, "dur": 5.131, "args": { "External id": 15150,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650524793.393, "dur": 27.271, "args": { "External id": 15151,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650524796.845, "dur": 22.925, "args": { "External id": 15152,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295650524825.639, "dur": 19.201, "args": { "External id": 15153,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650524826.388, "dur": 3.208, "args": { "External id": 15154,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650524832.318, "dur": 12.258, "args": { "External id": 15155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650524833.068, "dur": 11.104, "args": { "External id": 15156,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295650524848.023, "dur": 16.351, "args": { "External id": 15157,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650524848.759, "dur": 2.671, "args": { "External id": 15158,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650524852.155, "dur": 11.946, "args": { "External id": 15159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650524852.670, "dur": 11.131, "args": { "External id": 15160,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650524874.518, "dur": 0.728, "args": { "External id": 15161,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 8656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336757, "tid": 1336757, "ts": 1295650524884.713, "dur": 11.213, "args": { "External id": 15162,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "5", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 8657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524892.179, "dur": 2.074, "args": { "External id": 15163,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 8658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524902.455, "dur": 6.700, "args": { "External id": 15164,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524906.537, "dur": 1.032, "args": { "External id": 15165,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524910.304, "dur": 3.454, "args": { "External id": 15166,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524912.172, "dur": 0.879, "args": { "External id": 15167,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524915.097, "dur": 3.317, "args": { "External id": 15168,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524916.967, "dur": 0.899, "args": { "External id": 15169,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524921.280, "dur": 3.104, "args": { "External id": 15170,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 8665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524923.297, "dur": 0.500, "args": { "External id": 15171,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 8666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524925.528, "dur": 3.186, "args": { "External id": 15172,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 8667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524927.424, "dur": 0.601, "args": { "External id": 15173,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 8668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524929.609, "dur": 3.255, "args": { "External id": 15174,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4096, 4], [], [], [], []], "Ev Idx": 8669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524931.548, "dur": 0.769, "args": { "External id": 15175,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 8670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650524936.959, "dur": 5.676, "args": { "External id": 15176,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4096, 4], [], []], "Ev Idx": 8671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524941.152, "dur": 0.696, "args": { "External id": 15177,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 8672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524946.431, "dur": 3.352, "args": { "External id": 15178,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 8673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524948.276, "dur": 0.924, "args": { "External id": 15179,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650524956.023, "dur": 7.102, "args": { "External id": 15180,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 8675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524961.317, "dur": 0.773, "args": { "External id": 15181,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524964.260, "dur": 3.159, "args": { "External id": 15182,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 8677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524965.988, "dur": 0.833, "args": { "External id": 15183,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 8678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524969.919, "dur": 7.688, "args": { "External id": 15184,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 8679 } }, { "ph": "s", "id": 29, "pid": 1336757, "tid": 1336757, "ts": 1295650524969.919, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524975.055, "dur": 1.206, "args": { "External id": 15185,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650524978.814, "dur": 5.205, "args": { "External id": 15186,"Sequence number": 246740, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 8681 } }, { "ph": "s", "id": 28, "pid": 1336757, "tid": 1336757, "ts": 1295650524978.814, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650524982.414, "dur": 0.837, "args": { "External id": 15187,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650525023.994, "dur": 9.766, "args": { "External id": 15188,"Sequence number": 246741, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 8683 } }, { "ph": "s", "id": 27, "pid": 1336757, "tid": 1336757, "ts": 1295650525023.994, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650525030.421, "dur": 1.609, "args": { "External id": 15189,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650525035.038, "dur": 6.988, "args": { "External id": 15190,"Sequence number": 246742, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 8685 } }, { "ph": "s", "id": 26, "pid": 1336757, "tid": 1336757, "ts": 1295650525035.038, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650525038.474, "dur": 2.595, "args": { "External id": 15191,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 8686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650525047.708, "dur": 44.230, "args": { "External id": 15192,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650525049.865, "dur": 41.868, "args": { "External id": 15193,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650525053.074, "dur": 7.020, "args": { "External id": 15194,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 8689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650525055.300, "dur": 4.089, "args": { "External id": 15195,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650525062.060, "dur": 29.122, "args": { "External id": 15196,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 8691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650525118.335, "dur": 4.273, "args": { "External id": 15197,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8692 } }, { "ph": "s", "id": 25, "pid": 1336757, "tid": 1336757, "ts": 1295650525118.335, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650525124.804, "dur": 1.555, "args": { "External id": 15198,"Sequence number": 246744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8693 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650525154.426, "dur": 71698.303, "args": { "External id": 15199,"Sequence number": 246744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 8694 } }, { "ph": "s", "id": 24, "pid": 1336757, "tid": 1336757, "ts": 1295650525154.426, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650525168.102, "dur": 29.313, "args": { "External id": 15200,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650525169.348, "dur": 27.876, "args": { "External id": 15201,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650525170.737, "dur": 7.361, "args": { "External id": 15202,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650525172.303, "dur": 5.325, "args": { "External id": 15203,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650525179.027, "dur": 17.625, "args": { "External id": 15204,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 8699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650525214.694, "dur": 50.708, "args": { "External id": 15205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650525215.989, "dur": 6.193, "args": { "External id": 15206,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650525218.110, "dur": 3.792, "args": { "External id": 15207,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650525223.052, "dur": 42.034, "args": { "External id": 15208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 8703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650525224.437, "dur": 39.521, "args": { "External id": 15209,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650525272.305, "dur": 42.608, "args": { "External id": 15210,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 8705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650525273.669, "dur": 10.169, "args": { "External id": 15211,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 8706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650525278.175, "dur": 5.249, "args": { "External id": 15212,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650525295.722, "dur": 18.892, "args": { "External id": 15213,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650525296.836, "dur": 17.187, "args": { "External id": 15214,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 8709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295650525321.975, "dur": 27.203, "args": { "External id": 15215,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650525324.310, "dur": 6.608, "args": { "External id": 15216,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650525331.701, "dur": 17.071, "args": { "External id": 15217,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 8712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650525333.011, "dur": 15.252, "args": { "External id": 15218,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1336757, "ts": 1295650525359.693, "dur": 31.403, "args": { "External id": 15219,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650525395.551, "dur": 64.593, "args": { "External id": 15220,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650525399.536, "dur": 60.110, "args": { "External id": 15221,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650525406.088, "dur": 1.541, "args": { "External id": 15222,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650525409.782, "dur": 28.649, "args": { "External id": 15223,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650525411.871, "dur": 26.340, "args": { "External id": 15224,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 8719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650525416.702, "dur": 3.694, "args": { "External id": 15225,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650525421.518, "dur": 16.279, "args": { "External id": 15226,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 8721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1336757, "ts": 1295650525465.657, "dur": 64959.533, "args": { "External id": 15227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1336757, "ts": 1295650525467.833, "dur": 64955.398, "args": { "External id": 15228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650590442.222, "dur": 11.169, "args": { "External id": 15229,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650590449.157, "dur": 1.747, "args": { "External id": 15230,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650590461.196, "dur": 125.650, "args": { "External id": 15231,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650590463.097, "dur": 11.629, "args": { "External id": 15232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650590466.067, "dur": 7.795, "args": { "External id": 15233,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650590472.736, "dur": 0.849, "args": { "External id": 15234,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650590476.261, "dur": 109.825, "args": { "External id": 15235,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650590478.359, "dur": 106.500, "args": { "External id": 15236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650590591.040, "dur": 5.312, "args": { "External id": 15237,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650590593.407, "dur": 1.067, "args": { "External id": 15238,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650590609.115, "dur": 4.173, "args": { "External id": 15239,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650590626.439, "dur": 8.209, "args": { "External id": 15240,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650590629.177, "dur": 5.173, "args": { "External id": 15241,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650590786.537, "dur": 300.435, "args": { "External id": 15242,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650590792.105, "dur": 2.530, "args": { "External id": 15243,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650590799.605, "dur": 286.681, "args": { "External id": 15244,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650590803.124, "dur": 0.600, "args": { "External id": 15245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650590807.189, "dur": 32.905, "args": { "External id": 15246,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650590842.804, "dur": 6.176, "args": { "External id": 15247,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650590847.704, "dur": 0.867, "args": { "External id": 15248,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650590850.639, "dur": 29.951, "args": { "External id": 15249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650590852.159, "dur": 1.871, "args": { "External id": 15250,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650590856.331, "dur": 23.942, "args": { "External id": 15251,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650590861.126, "dur": 3.607, "args": { "External id": 15252,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650590885.987, "dur": 31.119, "args": { "External id": 15253,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650590919.997, "dur": 18.227, "args": { "External id": 15254,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650590942.586, "dur": 20.696, "args": { "External id": 15255,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650590965.772, "dur": 51.430, "args": { "External id": 15256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650591021.001, "dur": 26.875, "args": { "External id": 15257,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650591023.869, "dur": 2.332, "args": { "External id": 15258,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591028.601, "dur": 1.083, "args": { "External id": 15259,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650591053.227, "dur": 16.365, "args": { "External id": 15260,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650591071.956, "dur": 13.029, "args": { "External id": 15261,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650591095.778, "dur": 2.706, "args": { "External id": 15262,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650591106.981, "dur": 4.750, "args": { "External id": 15263,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591109.970, "dur": 0.850, "args": { "External id": 15264,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650591198.781, "dur": 110.791, "args": { "External id": 15265,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650591319.565, "dur": 7.350, "args": { "External id": 15266,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591323.307, "dur": 1.470, "args": { "External id": 15267,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650591330.750, "dur": 32.393, "args": { "External id": 15268,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650591370.731, "dur": 7.509, "args": { "External id": 15269,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650591372.889, "dur": 4.351, "args": { "External id": 15270,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591375.123, "dur": 1.853, "args": { "External id": 15271,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650591383.101, "dur": 54.057, "args": { "External id": 15272,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650591384.654, "dur": 51.863, "args": { "External id": 15273,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650591444.199, "dur": 20.291, "args": { "External id": 15274,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650591473.838, "dur": 4.755, "args": { "External id": 15275,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591476.589, "dur": 0.693, "args": { "External id": 15276,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650591483.549, "dur": 56.012, "args": { "External id": 15277,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650591484.504, "dur": 4.453, "args": { "External id": 15278,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650591485.544, "dur": 2.805, "args": { "External id": 15279,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591487.260, "dur": 0.946, "args": { "External id": 15280,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650591491.993, "dur": 47.173, "args": { "External id": 15281,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650591493.143, "dur": 45.293, "args": { "External id": 15282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650591543.979, "dur": 6.824, "args": { "External id": 15283,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591546.210, "dur": 3.062, "args": { "External id": 15284,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650591558.925, "dur": 1.960, "args": { "External id": 15285,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650591569.828, "dur": 10.602, "args": { "External id": 15286,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650591575.006, "dur": 5.131, "args": { "External id": 15287,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650591687.444, "dur": 210.106, "args": { "External id": 15288,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650591689.686, "dur": 2.308, "args": { "External id": 15289,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650591694.608, "dur": 202.446, "args": { "External id": 15290,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650591696.524, "dur": 0.582, "args": { "External id": 15291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650591698.702, "dur": 26.732, "args": { "External id": 15292,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650591727.308, "dur": 3.910, "args": { "External id": 15293,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591729.928, "dur": 0.884, "args": { "External id": 15294,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650591735.305, "dur": 26.906, "args": { "External id": 15295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650591736.350, "dur": 1.905, "args": { "External id": 15296,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650591739.991, "dur": 21.918, "args": { "External id": 15297,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650591745.808, "dur": 3.319, "args": { "External id": 15298,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650591764.358, "dur": 23.069, "args": { "External id": 15299,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650591789.163, "dur": 16.048, "args": { "External id": 15300,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650591808.795, "dur": 15.226, "args": { "External id": 15301,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650591825.903, "dur": 14.596, "args": { "External id": 15302,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650591842.523, "dur": 25.427, "args": { "External id": 15303,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650591846.875, "dur": 2.001, "args": { "External id": 15304,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591851.543, "dur": 1.173, "args": { "External id": 15305,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650591869.450, "dur": 14.418, "args": { "External id": 15306,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650591885.196, "dur": 10.687, "args": { "External id": 15307,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650591904.705, "dur": 2.242, "args": { "External id": 15308,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650591916.155, "dur": 3.514, "args": { "External id": 15309,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650591918.411, "dur": 0.492, "args": { "External id": 15310,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650592028.167, "dur": 62.719, "args": { "External id": 15311,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650592099.368, "dur": 6.624, "args": { "External id": 15312,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592102.739, "dur": 1.573, "args": { "External id": 15313,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650592107.400, "dur": 30.287, "args": { "External id": 15314,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650592143.061, "dur": 5.395, "args": { "External id": 15315,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650592144.495, "dur": 3.316, "args": { "External id": 15316,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592146.619, "dur": 0.939, "args": { "External id": 15317,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650592153.641, "dur": 42.715, "args": { "External id": 15318,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650592154.994, "dur": 40.765, "args": { "External id": 15319,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650592201.508, "dur": 16.488, "args": { "External id": 15320,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650592223.890, "dur": 18.859, "args": { "External id": 15321,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592225.952, "dur": 0.775, "args": { "External id": 15322,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650592251.267, "dur": 73.990, "args": { "External id": 15323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650592252.564, "dur": 11.021, "args": { "External id": 15324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650592256.592, "dur": 6.154, "args": { "External id": 15325,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592261.498, "dur": 1.042, "args": { "External id": 15326,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650592264.735, "dur": 60.147, "args": { "External id": 15327,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650592266.287, "dur": 57.555, "args": { "External id": 15328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650592330.654, "dur": 4.766, "args": { "External id": 15329,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592333.098, "dur": 1.038, "args": { "External id": 15330,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650592342.557, "dur": 1.812, "args": { "External id": 15331,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650592355.432, "dur": 7.167, "args": { "External id": 15332,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650592357.502, "dur": 4.835, "args": { "External id": 15333,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650592473.935, "dur": 233.911, "args": { "External id": 15334,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650592476.878, "dur": 2.409, "args": { "External id": 15335,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650592480.839, "dur": 226.421, "args": { "External id": 15336,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650592484.979, "dur": 0.472, "args": { "External id": 15337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650592487.013, "dur": 36.591, "args": { "External id": 15338,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650592525.128, "dur": 3.601, "args": { "External id": 15339,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592527.547, "dur": 0.910, "args": { "External id": 15340,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650592532.072, "dur": 26.952, "args": { "External id": 15341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650592535.593, "dur": 1.807, "args": { "External id": 15342,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650592538.982, "dur": 19.760, "args": { "External id": 15343,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650592542.429, "dur": 2.967, "args": { "External id": 15344,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650592560.783, "dur": 26.599, "args": { "External id": 15345,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650592589.154, "dur": 24.948, "args": { "External id": 15346,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650592617.059, "dur": 16.776, "args": { "External id": 15347,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650592635.595, "dur": 16.498, "args": { "External id": 15348,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650592654.054, "dur": 24.134, "args": { "External id": 15349,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650592658.046, "dur": 1.745, "args": { "External id": 15350,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592662.230, "dur": 0.885, "args": { "External id": 15351,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650592679.542, "dur": 13.083, "args": { "External id": 15352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650592693.885, "dur": 12.110, "args": { "External id": 15353,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650592714.428, "dur": 2.237, "args": { "External id": 15354,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650592725.704, "dur": 3.910, "args": { "External id": 15355,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592728.267, "dur": 0.577, "args": { "External id": 15356,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650592800.001, "dur": 58.736, "args": { "External id": 15357,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650592863.695, "dur": 7.034, "args": { "External id": 15358,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592866.564, "dur": 2.870, "args": { "External id": 15359,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650592872.300, "dur": 26.944, "args": { "External id": 15360,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650592944.939, "dur": 7.672, "args": { "External id": 15361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650592946.475, "dur": 5.313, "args": { "External id": 15362,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650592950.603, "dur": 0.931, "args": { "External id": 15363,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650592955.279, "dur": 88.382, "args": { "External id": 15364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650592956.281, "dur": 85.933, "args": { "External id": 15365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650593050.386, "dur": 19.195, "args": { "External id": 15366,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650593076.663, "dur": 5.040, "args": { "External id": 15367,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593079.450, "dur": 1.037, "args": { "External id": 15368,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650593089.389, "dur": 56.947, "args": { "External id": 15369,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650593090.438, "dur": 4.369, "args": { "External id": 15370,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650593091.593, "dur": 2.655, "args": { "External id": 15371,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593093.171, "dur": 0.939, "args": { "External id": 15372,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650593095.610, "dur": 50.286, "args": { "External id": 15373,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650593096.207, "dur": 48.735, "args": { "External id": 15374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650593152.738, "dur": 3.667, "args": { "External id": 15375,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593154.491, "dur": 0.819, "args": { "External id": 15376,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650593163.127, "dur": 1.704, "args": { "External id": 15377,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650593173.397, "dur": 8.846, "args": { "External id": 15378,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650593175.464, "dur": 6.461, "args": { "External id": 15379,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650593321.937, "dur": 218.901, "args": { "External id": 15380,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650593325.665, "dur": 5.371, "args": { "External id": 15381,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650593333.541, "dur": 206.936, "args": { "External id": 15382,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650593335.831, "dur": 0.453, "args": { "External id": 15383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650593338.451, "dur": 32.288, "args": { "External id": 15384,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650593372.450, "dur": 4.072, "args": { "External id": 15385,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593375.031, "dur": 0.999, "args": { "External id": 15386,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650593378.032, "dur": 28.738, "args": { "External id": 15387,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650593379.161, "dur": 1.623, "args": { "External id": 15388,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650593382.519, "dur": 23.895, "args": { "External id": 15389,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650593390.435, "dur": 2.709, "args": { "External id": 15390,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650593408.375, "dur": 23.629, "args": { "External id": 15391,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650593433.660, "dur": 16.157, "args": { "External id": 15392,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650593453.000, "dur": 15.431, "args": { "External id": 15393,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650593469.943, "dur": 15.394, "args": { "External id": 15394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650593486.953, "dur": 22.195, "args": { "External id": 15395,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650593488.592, "dur": 2.039, "args": { "External id": 15396,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593493.364, "dur": 1.031, "args": { "External id": 15397,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650593513.008, "dur": 14.157, "args": { "External id": 15398,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650593528.336, "dur": 11.019, "args": { "External id": 15399,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650593548.543, "dur": 2.840, "args": { "External id": 15400,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650593561.238, "dur": 4.401, "args": { "External id": 15401,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593564.087, "dur": 0.613, "args": { "External id": 15402,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650593641.426, "dur": 62.744, "args": { "External id": 15403,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650593708.884, "dur": 6.052, "args": { "External id": 15404,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593711.918, "dur": 1.627, "args": { "External id": 15405,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650593719.187, "dur": 26.331, "args": { "External id": 15406,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650593750.638, "dur": 5.474, "args": { "External id": 15407,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650593752.174, "dur": 3.167, "args": { "External id": 15408,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593754.302, "dur": 0.831, "args": { "External id": 15409,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650593759.082, "dur": 41.589, "args": { "External id": 15410,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650593759.995, "dur": 40.095, "args": { "External id": 15411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650593805.387, "dur": 15.496, "args": { "External id": 15412,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650593828.837, "dur": 4.159, "args": { "External id": 15413,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593831.136, "dur": 0.875, "args": { "External id": 15414,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650593837.317, "dur": 53.655, "args": { "External id": 15415,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650593838.024, "dur": 6.580, "args": { "External id": 15416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650593838.786, "dur": 5.178, "args": { "External id": 15417,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593840.626, "dur": 3.114, "args": { "External id": 15418,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650593847.577, "dur": 42.811, "args": { "External id": 15419,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650593848.469, "dur": 41.222, "args": { "External id": 15420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650593894.853, "dur": 4.066, "args": { "External id": 15421,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650593896.984, "dur": 0.769, "args": { "External id": 15422,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650593904.568, "dur": 1.676, "args": { "External id": 15423,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650593913.991, "dur": 6.556, "args": { "External id": 15424,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650593916.277, "dur": 3.935, "args": { "External id": 15425,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650594053.778, "dur": 231.584, "args": { "External id": 15426,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650594056.866, "dur": 3.433, "args": { "External id": 15427,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650594062.217, "dur": 222.422, "args": { "External id": 15428,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650594063.699, "dur": 0.356, "args": { "External id": 15429,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650594068.196, "dur": 24.481, "args": { "External id": 15430,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650594093.961, "dur": 4.499, "args": { "External id": 15431,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594096.730, "dur": 1.195, "args": { "External id": 15432,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650594099.805, "dur": 28.302, "args": { "External id": 15433,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650594100.834, "dur": 4.066, "args": { "External id": 15434,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650594106.726, "dur": 21.054, "args": { "External id": 15435,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650594111.767, "dur": 3.082, "args": { "External id": 15436,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650594129.493, "dur": 22.187, "args": { "External id": 15437,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650594153.213, "dur": 14.151, "args": { "External id": 15438,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650594170.475, "dur": 15.556, "args": { "External id": 15439,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650594187.386, "dur": 13.911, "args": { "External id": 15440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650594203.189, "dur": 22.145, "args": { "External id": 15441,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650594204.938, "dur": 2.476, "args": { "External id": 15442,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594210.097, "dur": 1.278, "args": { "External id": 15443,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650594245.098, "dur": 19.805, "args": { "External id": 15444,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650594266.428, "dur": 16.710, "args": { "External id": 15445,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650594295.948, "dur": 3.311, "args": { "External id": 15446,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650594311.947, "dur": 5.769, "args": { "External id": 15447,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594315.792, "dur": 0.740, "args": { "External id": 15448,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650594396.217, "dur": 66.024, "args": { "External id": 15449,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650594467.215, "dur": 7.245, "args": { "External id": 15450,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594472.095, "dur": 1.053, "args": { "External id": 15451,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650594475.900, "dur": 26.312, "args": { "External id": 15452,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650594506.609, "dur": 7.883, "args": { "External id": 15453,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650594508.742, "dur": 5.013, "args": { "External id": 15454,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594510.616, "dur": 2.900, "args": { "External id": 15455,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650594517.399, "dur": 41.190, "args": { "External id": 15456,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650594518.683, "dur": 39.346, "args": { "External id": 15457,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650594565.044, "dur": 15.619, "args": { "External id": 15458,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650594586.831, "dur": 4.336, "args": { "External id": 15459,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594589.227, "dur": 1.016, "args": { "External id": 15460,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650594595.670, "dur": 52.364, "args": { "External id": 15461,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650594596.761, "dur": 6.453, "args": { "External id": 15462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650594597.634, "dur": 5.006, "args": { "External id": 15463,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594601.550, "dur": 0.969, "args": { "External id": 15464,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650594603.731, "dur": 43.916, "args": { "External id": 15465,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650594604.910, "dur": 41.941, "args": { "External id": 15466,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650594652.103, "dur": 3.764, "args": { "External id": 15467,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594654.101, "dur": 0.699, "args": { "External id": 15468,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650594672.850, "dur": 1.687, "args": { "External id": 15469,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650594684.878, "dur": 9.498, "args": { "External id": 15470,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650594687.306, "dur": 6.794, "args": { "External id": 15471,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650594777.270, "dur": 245.599, "args": { "External id": 15472,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650594779.848, "dur": 2.863, "args": { "External id": 15473,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650594784.151, "dur": 237.588, "args": { "External id": 15474,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650594795.573, "dur": 0.355, "args": { "External id": 15475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650594799.042, "dur": 23.880, "args": { "External id": 15476,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650594826.768, "dur": 6.266, "args": { "External id": 15477,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594829.327, "dur": 3.244, "args": { "External id": 15478,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650594834.291, "dur": 23.172, "args": { "External id": 15479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650594835.288, "dur": 1.954, "args": { "External id": 15480,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650594838.861, "dur": 18.257, "args": { "External id": 15481,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650594841.528, "dur": 2.976, "args": { "External id": 15482,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650594859.364, "dur": 20.937, "args": { "External id": 15483,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650594881.808, "dur": 15.275, "args": { "External id": 15484,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650594900.145, "dur": 15.612, "args": { "External id": 15485,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650594917.058, "dur": 13.306, "args": { "External id": 15486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650594934.374, "dur": 22.925, "args": { "External id": 15487,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650594936.274, "dur": 2.051, "args": { "External id": 15488,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650594940.634, "dur": 2.556, "args": { "External id": 15489,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650594958.717, "dur": 12.690, "args": { "External id": 15490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650594972.252, "dur": 11.277, "args": { "External id": 15491,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650595032.717, "dur": 2.530, "args": { "External id": 15492,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650595044.822, "dur": 4.717, "args": { "External id": 15493,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595047.870, "dur": 0.678, "args": { "External id": 15494,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650595122.440, "dur": 57.578, "args": { "External id": 15495,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650595184.636, "dur": 5.665, "args": { "External id": 15496,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595187.671, "dur": 1.475, "args": { "External id": 15497,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650595191.427, "dur": 25.479, "args": { "External id": 15498,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650595221.417, "dur": 24.866, "args": { "External id": 15499,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650595222.775, "dur": 22.272, "args": { "External id": 15500,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595227.039, "dur": 17.100, "args": { "External id": 15501,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650595251.307, "dur": 63.443, "args": { "External id": 15502,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650595253.281, "dur": 60.490, "args": { "External id": 15503,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650595320.417, "dur": 19.377, "args": { "External id": 15504,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650595346.366, "dur": 4.830, "args": { "External id": 15505,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595348.968, "dur": 1.045, "args": { "External id": 15506,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650595355.770, "dur": 53.425, "args": { "External id": 15507,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650595359.549, "dur": 4.213, "args": { "External id": 15508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650595360.371, "dur": 2.749, "args": { "External id": 15509,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595362.095, "dur": 0.871, "args": { "External id": 15510,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650595364.375, "dur": 44.393, "args": { "External id": 15511,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650595365.149, "dur": 42.973, "args": { "External id": 15512,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650595413.444, "dur": 4.129, "args": { "External id": 15513,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595415.354, "dur": 1.099, "args": { "External id": 15514,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650595424.164, "dur": 1.668, "args": { "External id": 15515,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650595436.381, "dur": 7.112, "args": { "External id": 15516,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650595438.494, "dur": 4.738, "args": { "External id": 15517,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650595532.389, "dur": 202.303, "args": { "External id": 15518,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650595537.376, "dur": 2.215, "args": { "External id": 15519,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650595540.945, "dur": 193.306, "args": { "External id": 15520,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650595542.818, "dur": 0.371, "args": { "External id": 15521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650595546.829, "dur": 26.703, "args": { "External id": 15522,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650595574.985, "dur": 5.768, "args": { "External id": 15523,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595579.580, "dur": 0.885, "args": { "External id": 15524,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650595581.938, "dur": 22.411, "args": { "External id": 15525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650595582.834, "dur": 1.544, "args": { "External id": 15526,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650595585.973, "dur": 18.094, "args": { "External id": 15527,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650595588.610, "dur": 3.054, "args": { "External id": 15528,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650595605.766, "dur": 22.630, "args": { "External id": 15529,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650595629.741, "dur": 14.800, "args": { "External id": 15530,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650595647.080, "dur": 15.460, "args": { "External id": 15531,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650595664.074, "dur": 13.630, "args": { "External id": 15532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650595681.815, "dur": 23.353, "args": { "External id": 15533,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650595686.238, "dur": 2.234, "args": { "External id": 15534,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595690.452, "dur": 0.764, "args": { "External id": 15535,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650595706.650, "dur": 13.587, "args": { "External id": 15536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650595721.172, "dur": 12.117, "args": { "External id": 15537,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650595743.422, "dur": 1.862, "args": { "External id": 15538,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650595753.292, "dur": 3.711, "args": { "External id": 15539,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595755.658, "dur": 0.598, "args": { "External id": 15540,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650595817.697, "dur": 50.872, "args": { "External id": 15541,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650595873.143, "dur": 5.298, "args": { "External id": 15542,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595876.158, "dur": 1.195, "args": { "External id": 15543,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650595879.653, "dur": 24.640, "args": { "External id": 15544,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650595908.407, "dur": 8.211, "args": { "External id": 15545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650595909.704, "dur": 6.112, "args": { "External id": 15546,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650595913.943, "dur": 1.669, "args": { "External id": 15547,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650595919.117, "dur": 39.361, "args": { "External id": 15548,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650595920.241, "dur": 37.652, "args": { "External id": 15549,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650595962.684, "dur": 15.202, "args": { "External id": 15550,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650595982.550, "dur": 44.575, "args": { "External id": 15551,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596023.828, "dur": 1.524, "args": { "External id": 15552,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650596035.373, "dur": 56.458, "args": { "External id": 15553,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650596036.358, "dur": 4.404, "args": { "External id": 15554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650596037.793, "dur": 2.462, "args": { "External id": 15555,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596039.352, "dur": 0.747, "args": { "External id": 15556,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650596041.512, "dur": 49.951, "args": { "External id": 15557,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650596042.410, "dur": 48.256, "args": { "External id": 15558,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596098.471, "dur": 4.437, "args": { "External id": 15559,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596100.921, "dur": 0.881, "args": { "External id": 15560,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650596108.381, "dur": 1.822, "args": { "External id": 15561,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650596117.600, "dur": 6.960, "args": { "External id": 15562,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650596119.654, "dur": 4.533, "args": { "External id": 15563,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650596217.406, "dur": 236.709, "args": { "External id": 15564,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650596222.088, "dur": 2.557, "args": { "External id": 15565,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650596226.206, "dur": 227.293, "args": { "External id": 15566,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650596243.584, "dur": 0.614, "args": { "External id": 15567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650596246.518, "dur": 33.537, "args": { "External id": 15568,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650596282.571, "dur": 7.891, "args": { "External id": 15569,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596288.225, "dur": 1.700, "args": { "External id": 15570,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650596291.906, "dur": 29.896, "args": { "External id": 15571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650596294.164, "dur": 2.684, "args": { "External id": 15572,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650596299.046, "dur": 22.362, "args": { "External id": 15573,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650596304.419, "dur": 3.160, "args": { "External id": 15574,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650596323.454, "dur": 24.256, "args": { "External id": 15575,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650596349.856, "dur": 15.387, "args": { "External id": 15576,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650596368.163, "dur": 16.238, "args": { "External id": 15577,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650596385.914, "dur": 13.677, "args": { "External id": 15578,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650596401.231, "dur": 22.139, "args": { "External id": 15579,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650596403.359, "dur": 1.735, "args": { "External id": 15580,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596407.658, "dur": 1.201, "args": { "External id": 15581,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650596427.310, "dur": 12.388, "args": { "External id": 15582,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650596440.732, "dur": 11.625, "args": { "External id": 15583,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650596463.021, "dur": 2.782, "args": { "External id": 15584,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596476.074, "dur": 3.858, "args": { "External id": 15585,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596478.603, "dur": 0.519, "args": { "External id": 15586,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650596556.942, "dur": 58.239, "args": { "External id": 15587,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596620.184, "dur": 5.353, "args": { "External id": 15588,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596623.423, "dur": 0.965, "args": { "External id": 15589,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650596629.071, "dur": 24.486, "args": { "External id": 15590,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650596657.954, "dur": 5.936, "args": { "External id": 15591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650596659.825, "dur": 3.524, "args": { "External id": 15592,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596661.947, "dur": 1.195, "args": { "External id": 15593,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650596666.703, "dur": 40.945, "args": { "External id": 15594,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650596667.773, "dur": 39.194, "args": { "External id": 15595,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650596711.642, "dur": 15.584, "args": { "External id": 15596,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650596734.384, "dur": 29.833, "args": { "External id": 15597,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650596737.032, "dur": 26.746, "args": { "External id": 15598,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596745.165, "dur": 1.170, "args": { "External id": 15599,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650596770.521, "dur": 30.768, "args": { "External id": 15600,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650596772.440, "dur": 28.631, "args": { "External id": 15601,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596777.264, "dur": 4.759, "args": { "External id": 15602,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650596783.414, "dur": 17.194, "args": { "External id": 15603,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650596817.087, "dur": 6.055, "args": { "External id": 15604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9099 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650596819.014, "dur": 3.788, "args": { "External id": 15605,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650596824.161, "dur": 3.713, "args": { "External id": 15606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9101 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650596827.196, "dur": 0.606, "args": { "External id": 15607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650596870.188, "dur": 22.542, "args": { "External id": 15608,"Sequence number": 246745, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9103 } }, { "ph": "s", "id": 23, "pid": 1336757, "tid": 1336757, "ts": 1295650596870.188, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596898.460, "dur": 6.097, "args": { "External id": 15609,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596902.000, "dur": 1.023, "args": { "External id": 15610,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650596907.238, "dur": 8.221, "args": { "External id": 15611,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "1"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596913.521, "dur": 0.766, "args": { "External id": 15612,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596916.815, "dur": 3.540, "args": { "External id": 15613,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596918.821, "dur": 0.907, "args": { "External id": 15614,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596923.987, "dur": 6.734, "args": { "External id": 15615,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9110 } }, { "ph": "s", "id": 22, "pid": 1336757, "tid": 1336757, "ts": 1295650596923.987, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596928.281, "dur": 1.148, "args": { "External id": 15616,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596931.673, "dur": 7.339, "args": { "External id": 15617,"Sequence number": 246747, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9112 } }, { "ph": "s", "id": 21, "pid": 1336757, "tid": 1336757, "ts": 1295650596931.673, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596936.762, "dur": 1.432, "args": { "External id": 15618,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650596940.076, "dur": 5.308, "args": { "External id": 15619,"Sequence number": 246748, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9114 } }, { "ph": "s", "id": 20, "pid": 1336757, "tid": 1336757, "ts": 1295650596940.076, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596943.598, "dur": 0.977, "args": { "External id": 15620,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650596946.315, "dur": 5.452, "args": { "External id": 15621,"Sequence number": 246749, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9116 } }, { "ph": "s", "id": 19, "pid": 1336757, "tid": 1336757, "ts": 1295650596946.315, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650596949.628, "dur": 1.284, "args": { "External id": 15622,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650596956.044, "dur": 74.391, "args": { "External id": 15623,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650596957.559, "dur": 72.639, "args": { "External id": 15624,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650596960.486, "dur": 8.076, "args": { "External id": 15625,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650596964.534, "dur": 3.465, "args": { "External id": 15626,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650596969.316, "dur": 60.113, "args": { "External id": 15627,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650597060.169, "dur": 4.880, "args": { "External id": 15628,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9123 } }, { "ph": "s", "id": 18, "pid": 1336757, "tid": 1336757, "ts": 1295650597060.169, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650597067.256, "dur": 1.484, "args": { "External id": 15629,"Sequence number": 246751, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9124 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650597101.664, "dur": 42048.153, "args": { "External id": 15630,"Sequence number": 246751, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9125 } }, { "ph": "s", "id": 17, "pid": 1336757, "tid": 1336757, "ts": 1295650597101.664, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650597117.011, "dur": 34.485, "args": { "External id": 15631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650597120.127, "dur": 31.159, "args": { "External id": 15632,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650597121.444, "dur": 9.132, "args": { "External id": 15633,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650597123.563, "dur": 6.519, "args": { "External id": 15634,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650597131.325, "dur": 19.517, "args": { "External id": 15635,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650597167.780, "dur": 27.180, "args": { "External id": 15636,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650597169.061, "dur": 6.607, "args": { "External id": 15637,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650597171.172, "dur": 4.179, "args": { "External id": 15638,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650597177.520, "dur": 17.222, "args": { "External id": 15639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650597179.554, "dur": 14.803, "args": { "External id": 15640,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650597198.719, "dur": 22.442, "args": { "External id": 15641,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650597199.486, "dur": 4.976, "args": { "External id": 15642,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650597201.088, "dur": 3.087, "args": { "External id": 15643,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650597207.508, "dur": 13.465, "args": { "External id": 15644,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650597208.116, "dur": 12.536, "args": { "External id": 15645,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 9140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295650597226.706, "dur": 49.400, "args": { "External id": 15646,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650597244.916, "dur": 5.896, "args": { "External id": 15647,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650597252.421, "dur": 23.377, "args": { "External id": 15648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 9143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650597253.525, "dur": 21.677, "args": { "External id": 15649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1336757, "ts": 1295650597283.454, "dur": 31.562, "args": { "External id": 15650,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650597319.427, "dur": 83.949, "args": { "External id": 15651,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650597346.514, "dur": 56.318, "args": { "External id": 15652,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650597356.308, "dur": 1.402, "args": { "External id": 15653,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650597359.793, "dur": 24.508, "args": { "External id": 15654,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650597361.297, "dur": 22.807, "args": { "External id": 15655,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 9150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650597364.038, "dur": 3.218, "args": { "External id": 15656,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650597368.456, "dur": 15.297, "args": { "External id": 15657,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 9152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1336757, "ts": 1295650597408.152, "dur": 35450.307, "args": { "External id": 15658,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1336757, "ts": 1295650597410.081, "dur": 35445.637, "args": { "External id": 15659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650632874.970, "dur": 9.963, "args": { "External id": 15660,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650632881.152, "dur": 1.697, "args": { "External id": 15661,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650632893.330, "dur": 136.848, "args": { "External id": 15662,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650632895.152, "dur": 7.105, "args": { "External id": 15663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650632897.815, "dur": 3.627, "args": { "External id": 15664,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650632900.133, "dur": 1.095, "args": { "External id": 15665,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650632903.783, "dur": 125.655, "args": { "External id": 15666,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650632905.733, "dur": 122.175, "args": { "External id": 15667,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650633036.141, "dur": 5.702, "args": { "External id": 15668,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633038.951, "dur": 1.287, "args": { "External id": 15669,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650633053.926, "dur": 2.751, "args": { "External id": 15670,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650633067.047, "dur": 8.533, "args": { "External id": 15671,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650633069.576, "dur": 5.672, "args": { "External id": 15672,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650633207.983, "dur": 264.599, "args": { "External id": 15673,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650633213.043, "dur": 2.894, "args": { "External id": 15674,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650633220.251, "dur": 251.601, "args": { "External id": 15675,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650633222.336, "dur": 0.460, "args": { "External id": 15676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650633224.387, "dur": 50.537, "args": { "External id": 15677,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650633278.542, "dur": 8.833, "args": { "External id": 15678,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633284.847, "dur": 1.944, "args": { "External id": 15679,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650633289.141, "dur": 34.963, "args": { "External id": 15680,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650633291.170, "dur": 3.073, "args": { "External id": 15681,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650633296.295, "dur": 27.423, "args": { "External id": 15682,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650633301.226, "dur": 4.280, "args": { "External id": 15683,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650633329.131, "dur": 30.676, "args": { "External id": 15684,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650633361.625, "dur": 15.302, "args": { "External id": 15685,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650633380.548, "dur": 17.928, "args": { "External id": 15686,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650633399.898, "dur": 15.062, "args": { "External id": 15687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650633416.809, "dur": 22.685, "args": { "External id": 15688,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650633418.928, "dur": 1.864, "args": { "External id": 15689,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633423.606, "dur": 0.866, "args": { "External id": 15690,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650633442.997, "dur": 14.016, "args": { "External id": 15691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650633458.594, "dur": 12.260, "args": { "External id": 15692,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650633482.128, "dur": 3.095, "args": { "External id": 15693,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650633493.954, "dur": 5.654, "args": { "External id": 15694,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633497.251, "dur": 1.230, "args": { "External id": 15695,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650633583.970, "dur": 74.825, "args": { "External id": 15696,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650633664.768, "dur": 6.915, "args": { "External id": 15697,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633668.012, "dur": 0.861, "args": { "External id": 15698,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650633675.702, "dur": 30.364, "args": { "External id": 15699,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650633711.992, "dur": 6.721, "args": { "External id": 15700,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650633714.222, "dur": 3.796, "args": { "External id": 15701,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633716.423, "dur": 1.340, "args": { "External id": 15702,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650633721.973, "dur": 44.987, "args": { "External id": 15703,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650633723.440, "dur": 42.809, "args": { "External id": 15704,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650633771.782, "dur": 16.749, "args": { "External id": 15705,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650633797.507, "dur": 4.197, "args": { "External id": 15706,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633799.858, "dur": 0.918, "args": { "External id": 15707,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650633806.588, "dur": 58.297, "args": { "External id": 15708,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650633807.641, "dur": 4.049, "args": { "External id": 15709,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650633808.450, "dur": 2.683, "args": { "External id": 15710,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633809.922, "dur": 1.076, "args": { "External id": 15711,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650633814.631, "dur": 49.816, "args": { "External id": 15712,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650633821.503, "dur": 42.215, "args": { "External id": 15713,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650633868.821, "dur": 6.326, "args": { "External id": 15714,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650633870.924, "dur": 3.086, "args": { "External id": 15715,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650633881.673, "dur": 1.654, "args": { "External id": 15716,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650633891.393, "dur": 8.994, "args": { "External id": 15717,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650633895.940, "dur": 4.141, "args": { "External id": 15718,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650634030.999, "dur": 234.096, "args": { "External id": 15719,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650634033.780, "dur": 3.687, "args": { "External id": 15720,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650634039.297, "dur": 225.122, "args": { "External id": 15721,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650634041.204, "dur": 0.471, "args": { "External id": 15722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650634043.279, "dur": 29.152, "args": { "External id": 15723,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650634077.285, "dur": 3.918, "args": { "External id": 15724,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634079.701, "dur": 1.117, "args": { "External id": 15725,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650634084.376, "dur": 25.496, "args": { "External id": 15726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650634085.709, "dur": 3.689, "args": { "External id": 15727,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650634090.841, "dur": 18.666, "args": { "External id": 15728,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650634093.628, "dur": 3.082, "args": { "External id": 15729,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650634111.750, "dur": 23.498, "args": { "External id": 15730,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650634136.722, "dur": 15.243, "args": { "External id": 15731,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650634155.400, "dur": 14.235, "args": { "External id": 15732,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650634171.090, "dur": 14.607, "args": { "External id": 15733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650634187.184, "dur": 25.011, "args": { "External id": 15734,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650634191.431, "dur": 1.771, "args": { "External id": 15735,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634195.718, "dur": 1.340, "args": { "External id": 15736,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650634213.674, "dur": 27.374, "args": { "External id": 15737,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650634244.065, "dur": 18.217, "args": { "External id": 15738,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650634275.862, "dur": 3.208, "args": { "External id": 15739,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650634291.333, "dur": 5.488, "args": { "External id": 15740,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634294.695, "dur": 0.996, "args": { "External id": 15741,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650634381.567, "dur": 63.719, "args": { "External id": 15742,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650634452.716, "dur": 5.221, "args": { "External id": 15743,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634455.659, "dur": 1.134, "args": { "External id": 15744,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650634459.665, "dur": 26.469, "args": { "External id": 15745,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650634491.209, "dur": 6.431, "args": { "External id": 15746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650634493.205, "dur": 3.735, "args": { "External id": 15747,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634495.461, "dur": 1.280, "args": { "External id": 15748,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650634502.885, "dur": 45.308, "args": { "External id": 15749,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650634504.430, "dur": 42.912, "args": { "External id": 15750,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650634552.330, "dur": 19.962, "args": { "External id": 15751,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650634578.133, "dur": 3.924, "args": { "External id": 15752,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634580.446, "dur": 0.786, "args": { "External id": 15753,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650634586.573, "dur": 53.044, "args": { "External id": 15754,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650634587.519, "dur": 8.275, "args": { "External id": 15755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650634590.744, "dur": 4.395, "args": { "External id": 15756,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634594.011, "dur": 0.995, "args": { "External id": 15757,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650634596.391, "dur": 42.839, "args": { "External id": 15758,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650634597.273, "dur": 41.357, "args": { "External id": 15759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650634643.976, "dur": 4.245, "args": { "External id": 15760,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634646.068, "dur": 0.970, "args": { "External id": 15761,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650634653.982, "dur": 1.589, "args": { "External id": 15762,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650634666.242, "dur": 6.739, "args": { "External id": 15763,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650634668.681, "dur": 3.938, "args": { "External id": 15764,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650634757.787, "dur": 339.009, "args": { "External id": 15765,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650634760.790, "dur": 2.733, "args": { "External id": 15766,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650634765.094, "dur": 331.144, "args": { "External id": 15767,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650634769.295, "dur": 0.423, "args": { "External id": 15768,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650634771.129, "dur": 23.597, "args": { "External id": 15769,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650634796.371, "dur": 4.113, "args": { "External id": 15770,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650634799.037, "dur": 1.034, "args": { "External id": 15771,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650634803.745, "dur": 26.414, "args": { "External id": 15772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650634807.019, "dur": 1.403, "args": { "External id": 15773,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650634809.594, "dur": 20.232, "args": { "External id": 15774,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650634812.175, "dur": 2.838, "args": { "External id": 15775,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650634831.799, "dur": 23.886, "args": { "External id": 15776,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650634857.173, "dur": 37.556, "args": { "External id": 15777,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650634897.755, "dur": 38.611, "args": { "External id": 15778,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650634937.661, "dur": 38.831, "args": { "External id": 15779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650634978.318, "dur": 67.260, "args": { "External id": 15780,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650635018.949, "dur": 2.812, "args": { "External id": 15781,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635024.710, "dur": 1.295, "args": { "External id": 15782,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650635047.325, "dur": 24.228, "args": { "External id": 15783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650635072.817, "dur": 22.094, "args": { "External id": 15784,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650635105.272, "dur": 2.424, "args": { "External id": 15785,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650635117.297, "dur": 4.140, "args": { "External id": 15786,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635119.784, "dur": 0.776, "args": { "External id": 15787,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650635193.796, "dur": 81.507, "args": { "External id": 15788,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650635283.707, "dur": 8.077, "args": { "External id": 15789,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635287.984, "dur": 1.730, "args": { "External id": 15790,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650635293.940, "dur": 29.098, "args": { "External id": 15791,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650635329.004, "dur": 11.230, "args": { "External id": 15792,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650635330.961, "dur": 8.379, "args": { "External id": 15793,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635335.496, "dur": 3.622, "args": { "External id": 15794,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650635343.803, "dur": 47.328, "args": { "External id": 15795,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650635345.077, "dur": 45.415, "args": { "External id": 15796,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650635395.588, "dur": 18.438, "args": { "External id": 15797,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650635420.093, "dur": 4.365, "args": { "External id": 15798,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635422.685, "dur": 0.897, "args": { "External id": 15799,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650635428.733, "dur": 52.807, "args": { "External id": 15800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650635432.773, "dur": 4.253, "args": { "External id": 15801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650635433.767, "dur": 2.549, "args": { "External id": 15802,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635435.249, "dur": 0.939, "args": { "External id": 15803,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650635437.796, "dur": 43.388, "args": { "External id": 15804,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650635438.289, "dur": 42.187, "args": { "External id": 15805,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650635485.400, "dur": 3.940, "args": { "External id": 15806,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635487.522, "dur": 0.780, "args": { "External id": 15807,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650635498.328, "dur": 1.698, "args": { "External id": 15808,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650635508.674, "dur": 7.600, "args": { "External id": 15809,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650635510.654, "dur": 5.321, "args": { "External id": 15810,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650635608.458, "dur": 201.037, "args": { "External id": 15811,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650635610.832, "dur": 2.568, "args": { "External id": 15812,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650635619.502, "dur": 189.495, "args": { "External id": 15813,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650635621.012, "dur": 0.315, "args": { "External id": 15814,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650635622.517, "dur": 23.200, "args": { "External id": 15815,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650635647.844, "dur": 6.300, "args": { "External id": 15816,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635650.434, "dur": 3.113, "args": { "External id": 15817,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650635655.374, "dur": 22.506, "args": { "External id": 15818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650635656.909, "dur": 1.507, "args": { "External id": 15819,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650635659.679, "dur": 17.864, "args": { "External id": 15820,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650635662.063, "dur": 2.845, "args": { "External id": 15821,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650635682.040, "dur": 22.250, "args": { "External id": 15822,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650635705.630, "dur": 15.139, "args": { "External id": 15823,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650635724.073, "dur": 14.462, "args": { "External id": 15824,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650635740.263, "dur": 14.197, "args": { "External id": 15825,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650635756.315, "dur": 21.170, "args": { "External id": 15826,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650635758.169, "dur": 1.913, "args": { "External id": 15827,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635762.302, "dur": 0.780, "args": { "External id": 15828,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650635781.103, "dur": 14.447, "args": { "External id": 15829,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650635796.522, "dur": 11.244, "args": { "External id": 15830,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650635815.922, "dur": 1.848, "args": { "External id": 15831,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650635826.290, "dur": 3.693, "args": { "External id": 15832,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635828.815, "dur": 0.412, "args": { "External id": 15833,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650635893.888, "dur": 47.195, "args": { "External id": 15834,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650635945.680, "dur": 6.800, "args": { "External id": 15835,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650635948.448, "dur": 2.933, "args": { "External id": 15836,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650635953.795, "dur": 22.607, "args": { "External id": 15837,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650635982.541, "dur": 42.270, "args": { "External id": 15838,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650635983.834, "dur": 39.744, "args": { "External id": 15839,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636021.789, "dur": 1.384, "args": { "External id": 15840,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650636028.422, "dur": 49.438, "args": { "External id": 15841,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650636029.869, "dur": 47.279, "args": { "External id": 15842,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650636082.030, "dur": 16.744, "args": { "External id": 15843,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650636104.968, "dur": 6.541, "args": { "External id": 15844,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636109.486, "dur": 1.042, "args": { "External id": 15845,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650636115.174, "dur": 51.431, "args": { "External id": 15846,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650636116.398, "dur": 4.614, "args": { "External id": 15847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650636118.132, "dur": 2.207, "args": { "External id": 15848,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636119.484, "dur": 0.713, "args": { "External id": 15849,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650636121.568, "dur": 44.631, "args": { "External id": 15850,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650636124.773, "dur": 40.828, "args": { "External id": 15851,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650636170.719, "dur": 4.104, "args": { "External id": 15852,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636172.886, "dur": 0.788, "args": { "External id": 15853,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650636181.808, "dur": 1.459, "args": { "External id": 15854,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650636190.462, "dur": 7.067, "args": { "External id": 15855,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650636192.848, "dur": 4.407, "args": { "External id": 15856,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650636319.122, "dur": 254.394, "args": { "External id": 15857,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650636321.924, "dur": 5.484, "args": { "External id": 15858,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650636329.328, "dur": 243.748, "args": { "External id": 15859,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650636331.019, "dur": 0.382, "args": { "External id": 15860,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650636332.954, "dur": 24.440, "args": { "External id": 15861,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650636358.921, "dur": 7.183, "args": { "External id": 15862,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636364.170, "dur": 1.562, "args": { "External id": 15863,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650636367.166, "dur": 24.582, "args": { "External id": 15864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650636368.235, "dur": 1.694, "args": { "External id": 15865,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650636371.178, "dur": 20.273, "args": { "External id": 15866,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650636374.398, "dur": 3.700, "args": { "External id": 15867,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650636395.640, "dur": 22.929, "args": { "External id": 15868,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650636419.846, "dur": 14.444, "args": { "External id": 15869,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650636437.439, "dur": 17.341, "args": { "External id": 15870,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650636456.247, "dur": 13.857, "args": { "External id": 15871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650636471.976, "dur": 70.857, "args": { "External id": 15872,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650636520.387, "dur": 1.558, "args": { "External id": 15873,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636524.612, "dur": 0.780, "args": { "External id": 15874,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650636546.356, "dur": 12.046, "args": { "External id": 15875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650636559.342, "dur": 12.479, "args": { "External id": 15876,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650636581.672, "dur": 2.695, "args": { "External id": 15877,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650636595.022, "dur": 4.391, "args": { "External id": 15878,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636597.850, "dur": 0.396, "args": { "External id": 15879,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650636671.820, "dur": 67.315, "args": { "External id": 15880,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650636744.392, "dur": 6.665, "args": { "External id": 15881,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636749.041, "dur": 0.918, "args": { "External id": 15882,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650636752.478, "dur": 26.585, "args": { "External id": 15883,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650636783.715, "dur": 5.917, "args": { "External id": 15884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650636785.369, "dur": 3.665, "args": { "External id": 15885,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636787.279, "dur": 1.514, "args": { "External id": 15886,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650636792.368, "dur": 43.931, "args": { "External id": 15887,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650636793.389, "dur": 42.341, "args": { "External id": 15888,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650636842.721, "dur": 15.873, "args": { "External id": 15889,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650636864.729, "dur": 3.642, "args": { "External id": 15890,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636866.814, "dur": 0.783, "args": { "External id": 15891,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650636872.372, "dur": 51.732, "args": { "External id": 15892,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650636873.134, "dur": 6.363, "args": { "External id": 15893,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650636873.864, "dur": 5.105, "args": { "External id": 15894,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636877.777, "dur": 1.042, "args": { "External id": 15895,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650636880.069, "dur": 43.725, "args": { "External id": 15896,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650636880.598, "dur": 42.395, "args": { "External id": 15897,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650636927.990, "dur": 3.924, "args": { "External id": 15898,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650636929.912, "dur": 0.899, "args": { "External id": 15899,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650636937.528, "dur": 1.612, "args": { "External id": 15900,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650636948.616, "dur": 6.541, "args": { "External id": 15901,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650636950.539, "dur": 4.366, "args": { "External id": 15902,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650637084.098, "dur": 243.326, "args": { "External id": 15903,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650637089.285, "dur": 3.170, "args": { "External id": 15904,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650637094.060, "dur": 232.784, "args": { "External id": 15905,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650637095.476, "dur": 0.379, "args": { "External id": 15906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650637097.519, "dur": 24.717, "args": { "External id": 15907,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650637126.421, "dur": 6.100, "args": { "External id": 15908,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637131.022, "dur": 1.174, "args": { "External id": 15909,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650637133.394, "dur": 21.707, "args": { "External id": 15910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650637134.231, "dur": 1.714, "args": { "External id": 15911,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650637137.086, "dur": 17.722, "args": { "External id": 15912,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650637140.133, "dur": 2.767, "args": { "External id": 15913,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650637156.684, "dur": 24.363, "args": { "External id": 15914,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650637182.436, "dur": 15.189, "args": { "External id": 15915,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650637200.632, "dur": 14.252, "args": { "External id": 15916,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650637216.213, "dur": 33.303, "args": { "External id": 15917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650637255.006, "dur": 33.310, "args": { "External id": 15918,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650637257.985, "dur": 3.192, "args": { "External id": 15919,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637264.411, "dur": 1.589, "args": { "External id": 15920,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650637290.793, "dur": 18.270, "args": { "External id": 15921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650637310.316, "dur": 15.136, "args": { "External id": 15922,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650637337.108, "dur": 2.758, "args": { "External id": 15923,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650637350.263, "dur": 4.469, "args": { "External id": 15924,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637353.499, "dur": 0.460, "args": { "External id": 15925,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650637431.110, "dur": 64.313, "args": { "External id": 15926,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650637500.691, "dur": 4.713, "args": { "External id": 15927,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637503.479, "dur": 0.878, "args": { "External id": 15928,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650637507.027, "dur": 24.991, "args": { "External id": 15929,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650637536.802, "dur": 8.614, "args": { "External id": 15930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650637538.739, "dur": 6.089, "args": { "External id": 15931,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637543.005, "dur": 1.645, "args": { "External id": 15932,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650637548.317, "dur": 41.680, "args": { "External id": 15933,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650637549.889, "dur": 39.370, "args": { "External id": 15934,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650637594.238, "dur": 15.469, "args": { "External id": 15935,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650637615.327, "dur": 3.986, "args": { "External id": 15936,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637617.368, "dur": 1.051, "args": { "External id": 15937,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650637623.697, "dur": 50.348, "args": { "External id": 15938,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650637626.994, "dur": 3.729, "args": { "External id": 15939,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650637627.573, "dur": 2.481, "args": { "External id": 15940,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637629.007, "dur": 0.914, "args": { "External id": 15941,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650637631.511, "dur": 42.123, "args": { "External id": 15942,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650637632.467, "dur": 40.536, "args": { "External id": 15943,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650637678.526, "dur": 6.659, "args": { "External id": 15944,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637680.871, "dur": 3.014, "args": { "External id": 15945,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650637690.977, "dur": 1.455, "args": { "External id": 15946,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650637701.502, "dur": 6.732, "args": { "External id": 15947,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650637703.785, "dur": 4.220, "args": { "External id": 15948,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650637791.532, "dur": 242.857, "args": { "External id": 15949,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650637794.188, "dur": 2.272, "args": { "External id": 15950,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650637798.077, "dur": 235.673, "args": { "External id": 15951,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650637799.630, "dur": 0.386, "args": { "External id": 15952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650637803.939, "dur": 23.496, "args": { "External id": 15953,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650637828.820, "dur": 3.670, "args": { "External id": 15954,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637831.301, "dur": 0.780, "args": { "External id": 15955,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650637843.173, "dur": 24.022, "args": { "External id": 15956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650637844.114, "dur": 3.468, "args": { "External id": 15957,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650637848.818, "dur": 17.868, "args": { "External id": 15958,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650637851.751, "dur": 2.643, "args": { "External id": 15959,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650637868.781, "dur": 22.039, "args": { "External id": 15960,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650637892.351, "dur": 14.741, "args": { "External id": 15961,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650637909.656, "dur": 15.543, "args": { "External id": 15962,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650637928.780, "dur": 13.010, "args": { "External id": 15963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650637943.470, "dur": 21.075, "args": { "External id": 15964,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650637945.449, "dur": 1.442, "args": { "External id": 15965,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650637948.803, "dur": 0.814, "args": { "External id": 15966,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650637965.785, "dur": 12.579, "args": { "External id": 15967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650637979.375, "dur": 50.453, "args": { "External id": 15968,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650638043.391, "dur": 2.607, "args": { "External id": 15969,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650638055.200, "dur": 4.485, "args": { "External id": 15970,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638058.321, "dur": 0.542, "args": { "External id": 15971,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650638127.779, "dur": 58.367, "args": { "External id": 15972,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650638190.993, "dur": 5.391, "args": { "External id": 15973,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638193.878, "dur": 1.361, "args": { "External id": 15974,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650638202.284, "dur": 46.882, "args": { "External id": 15975,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650638258.860, "dur": 10.905, "args": { "External id": 15976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650638261.186, "dur": 7.271, "args": { "External id": 15977,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638263.890, "dur": 4.194, "args": { "External id": 15978,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650638273.708, "dur": 62.073, "args": { "External id": 15979,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650638275.464, "dur": 59.584, "args": { "External id": 15980,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650638340.732, "dur": 18.021, "args": { "External id": 15981,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650638365.359, "dur": 6.996, "args": { "External id": 15982,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638370.446, "dur": 0.858, "args": { "External id": 15983,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650638376.239, "dur": 52.773, "args": { "External id": 15984,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650638377.153, "dur": 3.825, "args": { "External id": 15985,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650638377.932, "dur": 2.420, "args": { "External id": 15986,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638379.289, "dur": 0.922, "args": { "External id": 15987,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650638381.551, "dur": 47.051, "args": { "External id": 15988,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650638384.709, "dur": 43.332, "args": { "External id": 15989,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650638432.693, "dur": 4.698, "args": { "External id": 15990,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638435.149, "dur": 1.030, "args": { "External id": 15991,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650638443.589, "dur": 1.889, "args": { "External id": 15992,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650638453.335, "dur": 10.138, "args": { "External id": 15993,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650638457.692, "dur": 5.484, "args": { "External id": 15994,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650638553.100, "dur": 196.338, "args": { "External id": 15995,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650638555.608, "dur": 2.440, "args": { "External id": 15996,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650638562.422, "dur": 186.456, "args": { "External id": 15997,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650638563.975, "dur": 0.407, "args": { "External id": 15998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650638565.542, "dur": 23.391, "args": { "External id": 15999,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650638590.767, "dur": 5.592, "args": { "External id": 16000,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638593.239, "dur": 2.657, "args": { "External id": 16001,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650638597.330, "dur": 25.890, "args": { "External id": 16002,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650638601.451, "dur": 1.398, "args": { "External id": 16003,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650638604.201, "dur": 18.782, "args": { "External id": 16004,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650638606.701, "dur": 3.002, "args": { "External id": 16005,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650638624.851, "dur": 21.089, "args": { "External id": 16006,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650638647.631, "dur": 14.738, "args": { "External id": 16007,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650638664.991, "dur": 15.100, "args": { "External id": 16008,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650638681.398, "dur": 13.096, "args": { "External id": 16009,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650638695.933, "dur": 25.137, "args": { "External id": 16010,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650638698.561, "dur": 1.514, "args": { "External id": 16011,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638703.821, "dur": 2.853, "args": { "External id": 16012,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650638722.591, "dur": 13.209, "args": { "External id": 16013,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650638736.829, "dur": 11.049, "args": { "External id": 16014,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650638755.817, "dur": 1.914, "args": { "External id": 16015,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650638766.219, "dur": 3.439, "args": { "External id": 16016,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638768.332, "dur": 0.669, "args": { "External id": 16017,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650638831.963, "dur": 47.502, "args": { "External id": 16018,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650638884.019, "dur": 6.853, "args": { "External id": 16019,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638889.045, "dur": 0.794, "args": { "External id": 16020,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650638892.381, "dur": 23.704, "args": { "External id": 16021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650638920.297, "dur": 5.784, "args": { "External id": 16022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650638921.960, "dur": 3.574, "args": { "External id": 16023,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650638923.588, "dur": 1.753, "args": { "External id": 16024,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650638928.337, "dur": 42.489, "args": { "External id": 16025,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650638931.640, "dur": 38.556, "args": { "External id": 16026,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650638974.664, "dur": 55.267, "args": { "External id": 16027,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650639036.781, "dur": 28.509, "args": { "External id": 16028,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650639039.611, "dur": 25.268, "args": { "External id": 16029,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639045.514, "dur": 1.598, "args": { "External id": 16030,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650639071.910, "dur": 28.098, "args": { "External id": 16031,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650639073.586, "dur": 26.154, "args": { "External id": 16032,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639078.446, "dur": 4.193, "args": { "External id": 16033,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650639083.746, "dur": 15.583, "args": { "External id": 16034,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650639113.106, "dur": 7.518, "args": { "External id": 16035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9530 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650639117.184, "dur": 3.161, "args": { "External id": 16036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650639121.795, "dur": 1.568, "args": { "External id": 16037,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9532 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650639122.375, "dur": 0.697, "args": { "External id": 16038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650639165.842, "dur": 22.644, "args": { "External id": 16039,"Sequence number": 246752, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650639191.001, "dur": 15.185, "args": { "External id": 16040,"Sequence number": 246753, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9535 } }, { "ph": "s", "id": 16, "pid": 1336757, "tid": 1336757, "ts": 1295650639191.001, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650639212.954, "dur": 6.651, "args": { "External id": 16041,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639216.846, "dur": 1.291, "args": { "External id": 16042,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650639224.359, "dur": 25.655, "args": { "External id": 16043,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639246.028, "dur": 1.597, "args": { "External id": 16044,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650639252.576, "dur": 5.040, "args": { "External id": 16045,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639255.560, "dur": 1.091, "args": { "External id": 16046,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650639264.180, "dur": 11.076, "args": { "External id": 16047,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9542 } }, { "ph": "s", "id": 15, "pid": 1336757, "tid": 1336757, "ts": 1295650639264.180, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639271.664, "dur": 1.621, "args": { "External id": 16048,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650639276.989, "dur": 6.905, "args": { "External id": 16049,"Sequence number": 246755, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9544 } }, { "ph": "s", "id": 14, "pid": 1336757, "tid": 1336757, "ts": 1295650639276.989, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639281.582, "dur": 0.988, "args": { "External id": 16050,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650639286.001, "dur": 9.492, "args": { "External id": 16051,"Sequence number": 246756, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9546 } }, { "ph": "s", "id": 13, "pid": 1336757, "tid": 1336757, "ts": 1295650639286.001, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639293.259, "dur": 0.961, "args": { "External id": 16052,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650639297.125, "dur": 6.361, "args": { "External id": 16053,"Sequence number": 246757, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9548 } }, { "ph": "s", "id": 12, "pid": 1336757, "tid": 1336757, "ts": 1295650639297.125, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639300.854, "dur": 1.275, "args": { "External id": 16054,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650639309.316, "dur": 36.051, "args": { "External id": 16055,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650639310.693, "dur": 34.463, "args": { "External id": 16056,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650639313.282, "dur": 7.849, "args": { "External id": 16057,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650639315.865, "dur": 4.766, "args": { "External id": 16058,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650639322.239, "dur": 22.470, "args": { "External id": 16059,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650639374.102, "dur": 7.047, "args": { "External id": 16060,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9555 } }, { "ph": "s", "id": 11, "pid": 1336757, "tid": 1336757, "ts": 1295650639374.102, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650639383.440, "dur": 1.160, "args": { "External id": 16061,"Sequence number": 246759, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9556 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650639420.520, "dur": 42875.390, "args": { "External id": 16062,"Sequence number": 246759, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9557 } }, { "ph": "s", "id": 10, "pid": 1336757, "tid": 1336757, "ts": 1295650639420.520, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650639438.619, "dur": 27.784, "args": { "External id": 16063,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650639439.590, "dur": 26.640, "args": { "External id": 16064,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650639441.037, "dur": 6.385, "args": { "External id": 16065,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650639442.491, "dur": 4.176, "args": { "External id": 16066,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650639448.170, "dur": 17.438, "args": { "External id": 16067,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650639482.305, "dur": 26.728, "args": { "External id": 16068,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650639483.423, "dur": 6.469, "args": { "External id": 16069,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639485.749, "dur": 3.856, "args": { "External id": 16070,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650639491.348, "dur": 17.455, "args": { "External id": 16071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650639493.154, "dur": 15.263, "args": { "External id": 16072,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650639512.381, "dur": 21.754, "args": { "External id": 16073,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650639513.301, "dur": 6.453, "args": { "External id": 16074,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639516.661, "dur": 2.825, "args": { "External id": 16075,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650639520.489, "dur": 13.452, "args": { "External id": 16076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650639520.953, "dur": 12.519, "args": { "External id": 16077,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 9572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295650639540.146, "dur": 20.315, "args": { "External id": 16078,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650639544.116, "dur": 2.610, "args": { "External id": 16079,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650639547.362, "dur": 12.812, "args": { "External id": 16080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 9575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650639547.880, "dur": 11.783, "args": { "External id": 16081,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1336757, "ts": 1295650639567.485, "dur": 22.879, "args": { "External id": 16082,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650639593.156, "dur": 51.219, "args": { "External id": 16083,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650639595.500, "dur": 48.378, "args": { "External id": 16084,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639600.569, "dur": 1.104, "args": { "External id": 16085,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650639602.843, "dur": 25.284, "args": { "External id": 16086,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650639604.597, "dur": 23.321, "args": { "External id": 16087,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 9582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650639609.076, "dur": 2.986, "args": { "External id": 16088,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650639612.944, "dur": 14.513, "args": { "External id": 16089,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 9584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1336757, "ts": 1295650639648.039, "dur": 36320.230, "args": { "External id": 16090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1336757, "ts": 1295650639649.303, "dur": 36316.988, "args": { "External id": 16091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650676006.205, "dur": 11.482, "args": { "External id": 16092,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676013.752, "dur": 1.393, "args": { "External id": 16093,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650676024.190, "dur": 121.309, "args": { "External id": 16094,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650676026.184, "dur": 6.621, "args": { "External id": 16095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650676028.455, "dur": 3.491, "args": { "External id": 16096,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676030.190, "dur": 1.456, "args": { "External id": 16097,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650676034.577, "dur": 110.134, "args": { "External id": 16098,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650676039.439, "dur": 103.945, "args": { "External id": 16099,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650676149.802, "dur": 5.259, "args": { "External id": 16100,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676152.317, "dur": 0.836, "args": { "External id": 16101,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650676164.055, "dur": 2.552, "args": { "External id": 16102,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650676176.928, "dur": 7.901, "args": { "External id": 16103,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650676179.209, "dur": 5.328, "args": { "External id": 16104,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650676349.588, "dur": 224.428, "args": { "External id": 16105,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650676353.326, "dur": 4.045, "args": { "External id": 16106,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650676361.606, "dur": 211.822, "args": { "External id": 16107,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650676363.692, "dur": 0.432, "args": { "External id": 16108,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650676365.614, "dur": 28.749, "args": { "External id": 16109,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650676396.290, "dur": 6.169, "args": { "External id": 16110,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676398.803, "dur": 3.264, "args": { "External id": 16111,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650676403.599, "dur": 28.729, "args": { "External id": 16112,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650676405.171, "dur": 1.558, "args": { "External id": 16113,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650676410.657, "dur": 21.378, "args": { "External id": 16114,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650676414.694, "dur": 3.063, "args": { "External id": 16115,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650676434.523, "dur": 23.674, "args": { "External id": 16116,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650676460.277, "dur": 16.595, "args": { "External id": 16117,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650676480.272, "dur": 17.307, "args": { "External id": 16118,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650676499.431, "dur": 14.460, "args": { "External id": 16119,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650676516.040, "dur": 27.402, "args": { "External id": 16120,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650676518.436, "dur": 1.625, "args": { "External id": 16121,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676524.829, "dur": 2.880, "args": { "External id": 16122,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650676545.144, "dur": 13.213, "args": { "External id": 16123,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650676560.094, "dur": 12.585, "args": { "External id": 16124,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650676582.493, "dur": 2.612, "args": { "External id": 16125,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650676592.875, "dur": 5.294, "args": { "External id": 16126,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676595.693, "dur": 1.297, "args": { "External id": 16127,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650676677.212, "dur": 75.664, "args": { "External id": 16128,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650676758.735, "dur": 8.748, "args": { "External id": 16129,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676763.369, "dur": 1.113, "args": { "External id": 16130,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650676769.283, "dur": 26.475, "args": { "External id": 16131,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650676801.440, "dur": 7.292, "args": { "External id": 16132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650676803.324, "dur": 4.546, "args": { "External id": 16133,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676805.722, "dur": 1.815, "args": { "External id": 16134,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650676812.282, "dur": 48.995, "args": { "External id": 16135,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650676815.700, "dur": 44.750, "args": { "External id": 16136,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650676866.165, "dur": 17.018, "args": { "External id": 16137,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650676889.489, "dur": 3.673, "args": { "External id": 16138,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676891.499, "dur": 0.696, "args": { "External id": 16139,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650676898.077, "dur": 52.898, "args": { "External id": 16140,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650676898.950, "dur": 6.039, "args": { "External id": 16141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650676899.661, "dur": 4.780, "args": { "External id": 16142,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676903.301, "dur": 0.993, "args": { "External id": 16143,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650676905.580, "dur": 44.965, "args": { "External id": 16144,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650676906.141, "dur": 43.769, "args": { "External id": 16145,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650676954.676, "dur": 4.494, "args": { "External id": 16146,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650676956.859, "dur": 0.726, "args": { "External id": 16147,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650676964.848, "dur": 1.765, "args": { "External id": 16148,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650676976.946, "dur": 43.426, "args": { "External id": 16149,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650676979.427, "dur": 40.112, "args": { "External id": 16150,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650677127.027, "dur": 247.317, "args": { "External id": 16151,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650677132.253, "dur": 2.536, "args": { "External id": 16152,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650677136.404, "dur": 237.347, "args": { "External id": 16153,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650677137.887, "dur": 0.450, "args": { "External id": 16154,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650677141.781, "dur": 25.274, "args": { "External id": 16155,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650677168.576, "dur": 5.623, "args": { "External id": 16156,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677172.873, "dur": 1.028, "args": { "External id": 16157,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650677175.273, "dur": 23.394, "args": { "External id": 16158,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650677176.406, "dur": 1.605, "args": { "External id": 16159,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650677179.167, "dur": 19.171, "args": { "External id": 16160,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650677181.875, "dur": 3.418, "args": { "External id": 16161,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650677200.186, "dur": 24.559, "args": { "External id": 16162,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650677226.137, "dur": 35.011, "args": { "External id": 16163,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650677266.745, "dur": 22.292, "args": { "External id": 16164,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650677293.702, "dur": 18.358, "args": { "External id": 16165,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650677314.496, "dur": 28.160, "args": { "External id": 16166,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650677319.822, "dur": 2.334, "args": { "External id": 16167,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677325.343, "dur": 0.968, "args": { "External id": 16168,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650677344.494, "dur": 14.331, "args": { "External id": 16169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650677360.045, "dur": 12.518, "args": { "External id": 16170,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650677385.787, "dur": 2.917, "args": { "External id": 16171,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650677399.908, "dur": 4.694, "args": { "External id": 16172,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677402.706, "dur": 0.646, "args": { "External id": 16173,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650677482.946, "dur": 64.792, "args": { "External id": 16174,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650677553.109, "dur": 5.175, "args": { "External id": 16175,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677556.223, "dur": 1.066, "args": { "External id": 16176,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650677560.102, "dur": 27.533, "args": { "External id": 16177,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650677592.692, "dur": 8.243, "args": { "External id": 16178,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650677594.435, "dur": 5.865, "args": { "External id": 16179,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677598.649, "dur": 1.432, "args": { "External id": 16180,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650677604.178, "dur": 42.261, "args": { "External id": 16181,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650677605.537, "dur": 40.119, "args": { "External id": 16182,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650677650.955, "dur": 16.477, "args": { "External id": 16183,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650677673.247, "dur": 4.245, "args": { "External id": 16184,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677675.685, "dur": 0.944, "args": { "External id": 16185,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650677684.328, "dur": 52.433, "args": { "External id": 16186,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650677685.297, "dur": 3.662, "args": { "External id": 16187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650677685.964, "dur": 2.493, "args": { "External id": 16188,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677687.384, "dur": 0.913, "args": { "External id": 16189,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650677689.660, "dur": 46.699, "args": { "External id": 16190,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650677690.944, "dur": 44.728, "args": { "External id": 16191,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650677762.394, "dur": 4.638, "args": { "External id": 16192,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677764.751, "dur": 0.902, "args": { "External id": 16193,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650677775.327, "dur": 1.534, "args": { "External id": 16194,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650677784.705, "dur": 9.239, "args": { "External id": 16195,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650677786.692, "dur": 6.922, "args": { "External id": 16196,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650677885.638, "dur": 359.495, "args": { "External id": 16197,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650677888.109, "dur": 2.397, "args": { "External id": 16198,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650677892.035, "dur": 352.305, "args": { "External id": 16199,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650677893.858, "dur": 0.442, "args": { "External id": 16200,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650677898.296, "dur": 24.717, "args": { "External id": 16201,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650677924.589, "dur": 3.879, "args": { "External id": 16202,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650677927.076, "dur": 1.082, "args": { "External id": 16203,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650677929.470, "dur": 26.182, "args": { "External id": 16204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650677930.684, "dur": 1.814, "args": { "External id": 16205,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650677933.844, "dur": 21.505, "args": { "External id": 16206,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650677939.011, "dur": 2.749, "args": { "External id": 16207,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650677957.162, "dur": 57.379, "args": { "External id": 16208,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650678017.631, "dur": 19.624, "args": { "External id": 16209,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650678040.348, "dur": 36.007, "args": { "External id": 16210,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650678080.141, "dur": 42.711, "args": { "External id": 16211,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650678125.100, "dur": 42.008, "args": { "External id": 16212,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650678127.501, "dur": 1.780, "args": { "External id": 16213,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678131.959, "dur": 1.298, "args": { "External id": 16214,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650678168.636, "dur": 27.859, "args": { "External id": 16215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650678197.501, "dur": 43.562, "args": { "External id": 16216,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650678258.375, "dur": 3.604, "args": { "External id": 16217,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650678274.877, "dur": 5.853, "args": { "External id": 16218,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678278.477, "dur": 0.983, "args": { "External id": 16219,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650678369.275, "dur": 66.263, "args": { "External id": 16220,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650678440.858, "dur": 5.699, "args": { "External id": 16221,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678444.043, "dur": 1.395, "args": { "External id": 16222,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650678448.370, "dur": 27.857, "args": { "External id": 16223,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650678481.256, "dur": 9.989, "args": { "External id": 16224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650678485.691, "dur": 4.732, "args": { "External id": 16225,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678488.370, "dur": 1.794, "args": { "External id": 16226,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650678499.055, "dur": 43.054, "args": { "External id": 16227,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650678500.284, "dur": 41.158, "args": { "External id": 16228,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650678546.265, "dur": 16.933, "args": { "External id": 16229,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650678569.567, "dur": 5.971, "args": { "External id": 16230,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678573.705, "dur": 1.039, "args": { "External id": 16231,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650678579.647, "dur": 49.283, "args": { "External id": 16232,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650678580.664, "dur": 3.920, "args": { "External id": 16233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650678581.466, "dur": 2.520, "args": { "External id": 16234,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678583.206, "dur": 0.616, "args": { "External id": 16235,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650678585.352, "dur": 43.165, "args": { "External id": 16236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650678586.460, "dur": 41.480, "args": { "External id": 16237,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650678635.057, "dur": 6.586, "args": { "External id": 16238,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678637.393, "dur": 2.944, "args": { "External id": 16239,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650678647.770, "dur": 1.633, "args": { "External id": 16240,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650678657.823, "dur": 7.678, "args": { "External id": 16241,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650678660.146, "dur": 5.055, "args": { "External id": 16242,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650678759.596, "dur": 201.138, "args": { "External id": 16243,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650678762.233, "dur": 2.910, "args": { "External id": 16244,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650678767.016, "dur": 193.169, "args": { "External id": 16245,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650678768.370, "dur": 0.574, "args": { "External id": 16246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650678770.578, "dur": 25.730, "args": { "External id": 16247,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650678797.917, "dur": 4.014, "args": { "External id": 16248,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678800.261, "dur": 1.378, "args": { "External id": 16249,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650678802.967, "dur": 27.995, "args": { "External id": 16250,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650678804.287, "dur": 1.710, "args": { "External id": 16251,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650678809.543, "dur": 21.052, "args": { "External id": 16252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650678814.735, "dur": 3.211, "args": { "External id": 16253,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650678832.506, "dur": 23.578, "args": { "External id": 16254,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650678857.423, "dur": 13.551, "args": { "External id": 16255,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650678873.966, "dur": 17.011, "args": { "External id": 16256,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650678892.724, "dur": 13.164, "args": { "External id": 16257,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650678907.717, "dur": 24.547, "args": { "External id": 16258,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650678909.453, "dur": 1.831, "args": { "External id": 16259,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678916.019, "dur": 0.857, "args": { "External id": 16260,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650678933.475, "dur": 13.002, "args": { "External id": 16261,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650678947.702, "dur": 11.153, "args": { "External id": 16262,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650678966.852, "dur": 1.857, "args": { "External id": 16263,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650678977.340, "dur": 3.784, "args": { "External id": 16264,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650678979.781, "dur": 0.473, "args": { "External id": 16265,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650679089.915, "dur": 58.705, "args": { "External id": 16266,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650679154.331, "dur": 8.386, "args": { "External id": 16267,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679159.457, "dur": 1.804, "args": { "External id": 16268,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650679163.931, "dur": 27.287, "args": { "External id": 16269,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650679195.813, "dur": 5.326, "args": { "External id": 16270,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650679197.271, "dur": 3.097, "args": { "External id": 16271,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679199.364, "dur": 0.763, "args": { "External id": 16272,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650679203.933, "dur": 67.186, "args": { "External id": 16273,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650679205.097, "dur": 64.442, "args": { "External id": 16274,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650679281.235, "dur": 21.962, "args": { "External id": 16275,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650679310.223, "dur": 5.789, "args": { "External id": 16276,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679313.540, "dur": 1.383, "args": { "External id": 16277,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650679320.210, "dur": 61.544, "args": { "External id": 16278,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650679321.389, "dur": 9.449, "args": { "External id": 16279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650679322.473, "dur": 7.737, "args": { "External id": 16280,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679329.066, "dur": 1.010, "args": { "External id": 16281,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650679331.570, "dur": 49.821, "args": { "External id": 16282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650679332.299, "dur": 48.512, "args": { "External id": 16283,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650679394.492, "dur": 4.125, "args": { "External id": 16284,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679396.523, "dur": 0.895, "args": { "External id": 16285,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650679406.263, "dur": 1.475, "args": { "External id": 16286,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650679415.982, "dur": 9.822, "args": { "External id": 16287,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650679420.846, "dur": 4.669, "args": { "External id": 16288,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650679519.989, "dur": 206.740, "args": { "External id": 16289,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650679524.745, "dur": 2.483, "args": { "External id": 16290,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650679528.697, "dur": 197.387, "args": { "External id": 16291,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650679530.075, "dur": 0.742, "args": { "External id": 16292,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650679532.313, "dur": 23.550, "args": { "External id": 16293,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650679557.900, "dur": 6.120, "args": { "External id": 16294,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679562.644, "dur": 1.047, "args": { "External id": 16295,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650679565.158, "dur": 25.511, "args": { "External id": 16296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650679566.253, "dur": 1.942, "args": { "External id": 16297,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650679571.608, "dur": 18.738, "args": { "External id": 16298,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650679574.891, "dur": 3.232, "args": { "External id": 16299,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650679592.276, "dur": 22.550, "args": { "External id": 16300,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650679616.245, "dur": 15.275, "args": { "External id": 16301,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650679633.988, "dur": 14.243, "args": { "External id": 16302,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650679649.768, "dur": 14.682, "args": { "External id": 16303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650679666.365, "dur": 26.358, "args": { "External id": 16304,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650679670.528, "dur": 1.582, "args": { "External id": 16305,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679676.464, "dur": 1.186, "args": { "External id": 16306,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650679694.180, "dur": 17.524, "args": { "External id": 16307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650679712.809, "dur": 12.244, "args": { "External id": 16308,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650679733.592, "dur": 1.956, "args": { "External id": 16309,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650679744.523, "dur": 3.532, "args": { "External id": 16310,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679746.691, "dur": 0.417, "args": { "External id": 16311,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650679810.083, "dur": 50.178, "args": { "External id": 16312,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650679865.128, "dur": 7.199, "args": { "External id": 16313,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679870.149, "dur": 1.089, "args": { "External id": 16314,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650679873.432, "dur": 24.313, "args": { "External id": 16315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650679901.990, "dur": 5.634, "args": { "External id": 16316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650679903.502, "dur": 3.483, "args": { "External id": 16317,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679905.487, "dur": 1.295, "args": { "External id": 16318,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650679910.291, "dur": 42.158, "args": { "External id": 16319,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650679913.357, "dur": 38.464, "args": { "External id": 16320,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650679956.442, "dur": 15.127, "args": { "External id": 16321,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650679976.549, "dur": 3.789, "args": { "External id": 16322,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650679978.718, "dur": 0.850, "args": { "External id": 16323,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650680020.331, "dur": 70.701, "args": { "External id": 16324,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650680032.519, "dur": 7.578, "args": { "External id": 16325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650680035.783, "dur": 3.474, "args": { "External id": 16326,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680037.849, "dur": 1.109, "args": { "External id": 16327,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650680040.784, "dur": 49.685, "args": { "External id": 16328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650680041.604, "dur": 48.186, "args": { "External id": 16329,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650680095.896, "dur": 4.317, "args": { "External id": 16330,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680098.046, "dur": 0.760, "args": { "External id": 16331,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650680108.913, "dur": 1.677, "args": { "External id": 16332,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680118.740, "dur": 8.544, "args": { "External id": 16333,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680121.005, "dur": 5.967, "args": { "External id": 16334,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650680214.924, "dur": 227.936, "args": { "External id": 16335,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680216.934, "dur": 2.372, "args": { "External id": 16336,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650680220.567, "dur": 221.674, "args": { "External id": 16337,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650680224.232, "dur": 0.399, "args": { "External id": 16338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650680226.007, "dur": 47.738, "args": { "External id": 16339,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650680277.160, "dur": 5.650, "args": { "External id": 16340,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680280.427, "dur": 1.869, "args": { "External id": 16341,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650680283.954, "dur": 27.453, "args": { "External id": 16342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680285.344, "dur": 2.759, "args": { "External id": 16343,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650680289.190, "dur": 21.878, "args": { "External id": 16344,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650680294.833, "dur": 2.692, "args": { "External id": 16345,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650680312.833, "dur": 22.855, "args": { "External id": 16346,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650680337.121, "dur": 13.886, "args": { "External id": 16347,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650680356.788, "dur": 16.374, "args": { "External id": 16348,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650680374.678, "dur": 13.311, "args": { "External id": 16349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650680390.018, "dur": 22.110, "args": { "External id": 16350,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650680391.602, "dur": 2.285, "args": { "External id": 16351,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680396.188, "dur": 0.863, "args": { "External id": 16352,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650680413.684, "dur": 12.881, "args": { "External id": 16353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650680429.931, "dur": 11.379, "args": { "External id": 16354,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650680451.059, "dur": 2.120, "args": { "External id": 16355,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650680462.663, "dur": 4.305, "args": { "External id": 16356,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680465.353, "dur": 0.515, "args": { "External id": 16357,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650680535.738, "dur": 56.488, "args": { "External id": 16358,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650680597.040, "dur": 5.385, "args": { "External id": 16359,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680599.876, "dur": 1.493, "args": { "External id": 16360,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650680603.894, "dur": 24.941, "args": { "External id": 16361,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650680633.759, "dur": 8.331, "args": { "External id": 16362,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650680638.137, "dur": 3.204, "args": { "External id": 16363,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680640.044, "dur": 1.113, "args": { "External id": 16364,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650680644.837, "dur": 40.158, "args": { "External id": 16365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650680645.776, "dur": 38.591, "args": { "External id": 16366,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650680689.131, "dur": 15.762, "args": { "External id": 16367,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650680710.291, "dur": 6.170, "args": { "External id": 16368,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680714.628, "dur": 0.928, "args": { "External id": 16369,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650680720.308, "dur": 50.825, "args": { "External id": 16370,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650680721.176, "dur": 5.952, "args": { "External id": 16371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650680721.898, "dur": 4.583, "args": { "External id": 16372,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680723.414, "dur": 2.875, "args": { "External id": 16373,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650680727.925, "dur": 42.726, "args": { "External id": 16374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650680728.532, "dur": 41.317, "args": { "External id": 16375,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650680774.684, "dur": 4.037, "args": { "External id": 16376,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680776.557, "dur": 1.033, "args": { "External id": 16377,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650680786.402, "dur": 1.459, "args": { "External id": 16378,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680794.745, "dur": 6.098, "args": { "External id": 16379,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680796.915, "dur": 3.619, "args": { "External id": 16380,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650680878.504, "dur": 260.161, "args": { "External id": 16381,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680881.002, "dur": 2.535, "args": { "External id": 16382,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650680886.798, "dur": 251.275, "args": { "External id": 16383,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650680887.920, "dur": 0.571, "args": { "External id": 16384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650680924.434, "dur": 21.117, "args": { "External id": 16385,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650680947.169, "dur": 3.403, "args": { "External id": 16386,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650680949.558, "dur": 0.752, "args": { "External id": 16387,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650680951.348, "dur": 22.140, "args": { "External id": 16388,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650680952.054, "dur": 3.182, "args": { "External id": 16389,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650680956.322, "dur": 16.933, "args": { "External id": 16390,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650680958.694, "dur": 2.178, "args": { "External id": 16391,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650680974.690, "dur": 57.985, "args": { "External id": 16392,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650681035.173, "dur": 14.955, "args": { "External id": 16393,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650681055.026, "dur": 15.475, "args": { "External id": 16394,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650681071.832, "dur": 13.485, "args": { "External id": 16395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650681087.313, "dur": 20.710, "args": { "External id": 16396,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650681088.862, "dur": 1.836, "args": { "External id": 16397,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681092.885, "dur": 0.735, "args": { "External id": 16398,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650681109.506, "dur": 13.645, "args": { "External id": 16399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650681126.383, "dur": 10.723, "args": { "External id": 16400,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650681146.699, "dur": 2.315, "args": { "External id": 16401,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650681158.216, "dur": 4.065, "args": { "External id": 16402,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681160.891, "dur": 0.530, "args": { "External id": 16403,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650681249.169, "dur": 77.935, "args": { "External id": 16404,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650681333.411, "dur": 7.371, "args": { "External id": 16405,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681337.288, "dur": 1.369, "args": { "External id": 16406,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650681342.104, "dur": 26.843, "args": { "External id": 16407,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650681376.983, "dur": 5.869, "args": { "External id": 16408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650681378.588, "dur": 3.560, "args": { "External id": 16409,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681380.893, "dur": 1.024, "args": { "External id": 16410,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650681385.701, "dur": 42.982, "args": { "External id": 16411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650681387.125, "dur": 41.022, "args": { "External id": 16412,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650681433.253, "dur": 15.959, "args": { "External id": 16413,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650681454.740, "dur": 6.270, "args": { "External id": 16414,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681459.247, "dur": 0.776, "args": { "External id": 16415,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650681465.397, "dur": 56.385, "args": { "External id": 16416,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650681466.247, "dur": 5.940, "args": { "External id": 16417,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650681466.787, "dur": 4.811, "args": { "External id": 16418,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681470.708, "dur": 0.743, "args": { "External id": 16419,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650681472.894, "dur": 48.541, "args": { "External id": 16420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650681475.763, "dur": 44.882, "args": { "External id": 16421,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650681525.640, "dur": 3.900, "args": { "External id": 16422,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681527.449, "dur": 0.915, "args": { "External id": 16423,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650681536.031, "dur": 1.771, "args": { "External id": 16424,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650681545.588, "dur": 8.191, "args": { "External id": 16425,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650681549.851, "dur": 3.630, "args": { "External id": 16426,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650681647.090, "dur": 202.632, "args": { "External id": 16427,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650681650.457, "dur": 2.027, "args": { "External id": 16428,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650681653.999, "dur": 195.154, "args": { "External id": 16429,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650681658.410, "dur": 0.393, "args": { "External id": 16430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650681660.341, "dur": 24.238, "args": { "External id": 16431,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650681686.062, "dur": 3.840, "args": { "External id": 16432,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681688.464, "dur": 1.065, "args": { "External id": 16433,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650681690.891, "dur": 32.363, "args": { "External id": 16434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650681701.155, "dur": 1.807, "args": { "External id": 16435,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650681704.145, "dur": 18.798, "args": { "External id": 16436,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650681706.910, "dur": 2.640, "args": { "External id": 16437,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650681724.805, "dur": 21.945, "args": { "External id": 16438,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650681748.336, "dur": 14.226, "args": { "External id": 16439,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650681765.598, "dur": 14.788, "args": { "External id": 16440,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650681781.699, "dur": 13.812, "args": { "External id": 16441,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650681797.382, "dur": 23.194, "args": { "External id": 16442,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650681799.202, "dur": 1.929, "args": { "External id": 16443,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681805.504, "dur": 1.044, "args": { "External id": 16444,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650681821.748, "dur": 13.601, "args": { "External id": 16445,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650681836.300, "dur": 11.895, "args": { "External id": 16446,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650681856.404, "dur": 1.780, "args": { "External id": 16447,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650681866.357, "dur": 3.670, "args": { "External id": 16448,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650681868.707, "dur": 0.550, "args": { "External id": 16449,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650681934.615, "dur": 86.310, "args": { "External id": 16450,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650682028.380, "dur": 9.944, "args": { "External id": 16451,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682033.984, "dur": 2.835, "args": { "External id": 16452,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650682039.833, "dur": 31.089, "args": { "External id": 16453,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650682076.174, "dur": 5.527, "args": { "External id": 16454,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650682077.434, "dur": 3.575, "args": { "External id": 16455,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682079.673, "dur": 1.102, "args": { "External id": 16456,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650682084.808, "dur": 48.302, "args": { "External id": 16457,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650682088.465, "dur": 44.006, "args": { "External id": 16458,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650682137.164, "dur": 16.376, "args": { "External id": 16459,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650682158.549, "dur": 26.400, "args": { "External id": 16460,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650682161.257, "dur": 23.165, "args": { "External id": 16461,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682166.724, "dur": 1.335, "args": { "External id": 16462,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650682191.116, "dur": 29.338, "args": { "External id": 16463,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650682192.826, "dur": 27.307, "args": { "External id": 16464,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682197.477, "dur": 4.720, "args": { "External id": 16465,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650682205.239, "dur": 14.398, "args": { "External id": 16466,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650682253.684, "dur": 6.221, "args": { "External id": 16467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9962 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650682255.791, "dur": 3.422, "args": { "External id": 16468,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650682261.823, "dur": 2.130, "args": { "External id": 16469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9964 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650682262.830, "dur": 0.989, "args": { "External id": 16470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650682316.902, "dur": 28.423, "args": { "External id": 16471,"Sequence number": 246760, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650682347.219, "dur": 16.303, "args": { "External id": 16472,"Sequence number": 246761, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9967 } }, { "ph": "s", "id": 9, "pid": 1336757, "tid": 1336757, "ts": 1295650682347.219, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650682370.289, "dur": 7.448, "args": { "External id": 16473,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682374.949, "dur": 1.255, "args": { "External id": 16474,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650682386.917, "dur": 6.929, "args": { "External id": 16475,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "3"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682391.298, "dur": 1.212, "args": { "External id": 16476,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650682395.277, "dur": 3.366, "args": { "External id": 16477,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682396.988, "dur": 1.052, "args": { "External id": 16478,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650682404.943, "dur": 6.463, "args": { "External id": 16479,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9974 } }, { "ph": "s", "id": 8, "pid": 1336757, "tid": 1336757, "ts": 1295650682404.943, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682408.830, "dur": 1.358, "args": { "External id": 16480,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650682412.660, "dur": 6.209, "args": { "External id": 16481,"Sequence number": 246763, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9976 } }, { "ph": "s", "id": 7, "pid": 1336757, "tid": 1336757, "ts": 1295650682412.660, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682417.334, "dur": 0.757, "args": { "External id": 16482,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336757, "tid": 1336757, "ts": 1295650682419.911, "dur": 8.362, "args": { "External id": 16483,"Sequence number": 246764, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9978 } }, { "ph": "s", "id": 6, "pid": 1336757, "tid": 1336757, "ts": 1295650682419.911, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682426.523, "dur": 0.921, "args": { "External id": 16484,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650682429.530, "dur": 6.971, "args": { "External id": 16485,"Sequence number": 246765, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9980 } }, { "ph": "s", "id": 5, "pid": 1336757, "tid": 1336757, "ts": 1295650682429.530, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682432.831, "dur": 2.816, "args": { "External id": 16486,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650682440.822, "dur": 32.913, "args": { "External id": 16487,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650682442.290, "dur": 31.023, "args": { "External id": 16488,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650682444.822, "dur": 7.986, "args": { "External id": 16489,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650682447.558, "dur": 4.515, "args": { "External id": 16490,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650682453.918, "dur": 18.969, "args": { "External id": 16491,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650682502.673, "dur": 6.085, "args": { "External id": 16492,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9987 } }, { "ph": "s", "id": 4, "pid": 1336757, "tid": 1336757, "ts": 1295650682502.673, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650682511.370, "dur": 1.288, "args": { "External id": 16493,"Sequence number": 246767, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9988 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336757, "tid": 1336757, "ts": 1295650682545.908, "dur": 43408.949, "args": { "External id": 16494,"Sequence number": 246767, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9989 } }, { "ph": "s", "id": 3, "pid": 1336757, "tid": 1336757, "ts": 1295650682545.908, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336757, "tid": 1336757, "ts": 1295650682561.204, "dur": 27.335, "args": { "External id": 16495,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295650682561.942, "dur": 26.379, "args": { "External id": 16496,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650682563.125, "dur": 7.598, "args": { "External id": 16497,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650682564.572, "dur": 5.651, "args": { "External id": 16498,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650682571.452, "dur": 16.442, "args": { "External id": 16499,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650682603.460, "dur": 28.698, "args": { "External id": 16500,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650682604.887, "dur": 8.459, "args": { "External id": 16501,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682608.803, "dur": 4.247, "args": { "External id": 16502,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650682614.917, "dur": 17.020, "args": { "External id": 16503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650682616.910, "dur": 14.556, "args": { "External id": 16504,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336757, "tid": 1336757, "ts": 1295650682635.841, "dur": 19.769, "args": { "External id": 16505,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650682636.780, "dur": 4.530, "args": { "External id": 16506,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682638.372, "dur": 2.685, "args": { "External id": 16507,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650682641.776, "dur": 13.645, "args": { "External id": 16508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650682642.402, "dur": 12.628, "args": { "External id": 16509,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 10004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295650682661.406, "dur": 25.401, "args": { "External id": 16510,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 10005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650682665.864, "dur": 2.987, "args": { "External id": 16511,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295650682669.587, "dur": 16.952, "args": { "External id": 16512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 10007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650682670.087, "dur": 16.121, "args": { "External id": 16513,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1336757, "ts": 1295650682691.573, "dur": 24.160, "args": { "External id": 16514,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650682718.676, "dur": 50.400, "args": { "External id": 16515,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650682720.733, "dur": 47.944, "args": { "External id": 16516,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682725.651, "dur": 2.887, "args": { "External id": 16517,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650682729.544, "dur": 22.082, "args": { "External id": 16518,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650682731.225, "dur": 19.946, "args": { "External id": 16519,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 10014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650682733.766, "dur": 2.844, "args": { "External id": 16520,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650682737.397, "dur": 13.342, "args": { "External id": 16521,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 10016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1336757, "ts": 1295650682774.916, "dur": 36987.796, "args": { "External id": 16522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 10017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1336757, "ts": 1295650682776.488, "dur": 36983.344, "args": { "External id": 16523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 10018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650719780.503, "dur": 9.414, "args": { "External id": 16524,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650719786.324, "dur": 1.672, "args": { "External id": 16525,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650719795.423, "dur": 117.180, "args": { "External id": 16526,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650719797.287, "dur": 9.556, "args": { "External id": 16527,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650719799.841, "dur": 6.082, "args": { "External id": 16528,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650719804.485, "dur": 1.126, "args": { "External id": 16529,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650719808.116, "dur": 103.748, "args": { "External id": 16530,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650719810.128, "dur": 100.660, "args": { "External id": 16531,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650719916.610, "dur": 4.389, "args": { "External id": 16532,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650719918.663, "dur": 0.770, "args": { "External id": 16533,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650719930.641, "dur": 2.815, "args": { "External id": 16534,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650719946.095, "dur": 8.300, "args": { "External id": 16535,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650719948.910, "dur": 5.177, "args": { "External id": 16536,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650720120.825, "dur": 256.899, "args": { "External id": 16537,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650720126.517, "dur": 3.670, "args": { "External id": 16538,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650720132.066, "dur": 244.960, "args": { "External id": 16539,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650720133.738, "dur": 0.836, "args": { "External id": 16540,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650720136.233, "dur": 30.836, "args": { "External id": 16541,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650720171.999, "dur": 6.604, "args": { "External id": 16542,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720177.155, "dur": 1.077, "args": { "External id": 16543,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650720179.673, "dur": 25.575, "args": { "External id": 16544,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650720180.695, "dur": 1.616, "args": { "External id": 16545,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650720183.631, "dur": 21.258, "args": { "External id": 16546,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650720187.773, "dur": 3.948, "args": { "External id": 16547,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650720207.044, "dur": 43.161, "args": { "External id": 16548,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650720253.731, "dur": 21.591, "args": { "External id": 16549,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650720279.365, "dur": 18.567, "args": { "External id": 16550,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650720300.016, "dur": 14.744, "args": { "External id": 16551,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650720319.317, "dur": 26.482, "args": { "External id": 16552,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650720324.056, "dur": 1.936, "args": { "External id": 16553,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720328.700, "dur": 1.198, "args": { "External id": 16554,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650720347.339, "dur": 13.934, "args": { "External id": 16555,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650720362.686, "dur": 13.072, "args": { "External id": 16556,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650720387.593, "dur": 3.168, "args": { "External id": 16557,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650720401.187, "dur": 4.684, "args": { "External id": 16558,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720404.105, "dur": 0.828, "args": { "External id": 16559,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650720488.846, "dur": 76.495, "args": { "External id": 16560,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650720571.536, "dur": 6.055, "args": { "External id": 16561,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720574.275, "dur": 0.826, "args": { "External id": 16562,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650720579.449, "dur": 30.275, "args": { "External id": 16563,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650720615.387, "dur": 10.040, "args": { "External id": 16564,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650720617.655, "dur": 7.011, "args": { "External id": 16565,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720622.352, "dur": 2.012, "args": { "External id": 16566,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650720629.030, "dur": 43.006, "args": { "External id": 16567,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650720630.409, "dur": 40.917, "args": { "External id": 16568,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650720676.621, "dur": 17.325, "args": { "External id": 16569,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650720700.353, "dur": 4.303, "args": { "External id": 16570,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720702.883, "dur": 0.935, "args": { "External id": 16571,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650720711.729, "dur": 49.564, "args": { "External id": 16572,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650720712.504, "dur": 3.732, "args": { "External id": 16573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650720713.217, "dur": 2.443, "args": { "External id": 16574,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720714.785, "dur": 0.727, "args": { "External id": 16575,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650720716.772, "dur": 44.115, "args": { "External id": 16576,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650720717.422, "dur": 42.878, "args": { "External id": 16577,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650720767.610, "dur": 5.012, "args": { "External id": 16578,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720769.878, "dur": 1.164, "args": { "External id": 16579,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650720779.077, "dur": 2.047, "args": { "External id": 16580,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650720789.396, "dur": 6.305, "args": { "External id": 16581,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650720791.307, "dur": 4.124, "args": { "External id": 16582,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650720893.387, "dur": 241.754, "args": { "External id": 16583,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650720897.987, "dur": 2.681, "args": { "External id": 16584,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650720902.045, "dur": 232.530, "args": { "External id": 16585,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650720903.444, "dur": 0.330, "args": { "External id": 16586,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650720905.190, "dur": 22.715, "args": { "External id": 16587,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650720929.556, "dur": 4.886, "args": { "External id": 16588,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650720933.594, "dur": 0.590, "args": { "External id": 16589,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650720935.714, "dur": 25.902, "args": { "External id": 16590,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650720937.184, "dur": 1.826, "args": { "External id": 16591,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650720940.570, "dur": 20.781, "args": { "External id": 16592,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650720945.586, "dur": 2.979, "args": { "External id": 16593,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650720963.257, "dur": 61.707, "args": { "External id": 16594,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650721027.664, "dur": 16.049, "args": { "External id": 16595,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650721047.255, "dur": 15.629, "args": { "External id": 16596,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650721064.476, "dur": 14.393, "args": { "External id": 16597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650721080.999, "dur": 23.365, "args": { "External id": 16598,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650721083.257, "dur": 2.198, "args": { "External id": 16599,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721087.854, "dur": 0.832, "args": { "External id": 16600,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650721108.208, "dur": 12.668, "args": { "External id": 16601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650721121.920, "dur": 11.339, "args": { "External id": 16602,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650721144.098, "dur": 2.766, "args": { "External id": 16603,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650721157.572, "dur": 3.887, "args": { "External id": 16604,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721160.147, "dur": 0.366, "args": { "External id": 16605,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650721254.264, "dur": 74.697, "args": { "External id": 16606,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650721335.869, "dur": 7.058, "args": { "External id": 16607,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721339.603, "dur": 1.567, "args": { "External id": 16608,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650721346.917, "dur": 28.609, "args": { "External id": 16609,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650721381.209, "dur": 6.520, "args": { "External id": 16610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650721383.077, "dur": 3.988, "args": { "External id": 16611,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721384.934, "dur": 1.927, "args": { "External id": 16612,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650721390.848, "dur": 44.915, "args": { "External id": 16613,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650721392.040, "dur": 43.062, "args": { "External id": 16614,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650721440.495, "dur": 17.560, "args": { "External id": 16615,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650721466.363, "dur": 4.421, "args": { "External id": 16616,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721468.694, "dur": 0.989, "args": { "External id": 16617,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650721474.954, "dur": 51.691, "args": { "External id": 16618,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650721475.858, "dur": 3.827, "args": { "External id": 16619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650721476.770, "dur": 2.401, "args": { "External id": 16620,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721477.964, "dur": 1.079, "args": { "External id": 16621,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650721482.575, "dur": 43.638, "args": { "External id": 16622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650721483.135, "dur": 42.613, "args": { "External id": 16623,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650721531.684, "dur": 7.655, "args": { "External id": 16624,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721534.043, "dur": 3.538, "args": { "External id": 16625,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650721545.863, "dur": 2.264, "args": { "External id": 16626,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650721556.437, "dur": 6.584, "args": { "External id": 16627,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650721558.414, "dur": 4.337, "args": { "External id": 16628,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650721659.080, "dur": 301.620, "args": { "External id": 16629,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650721661.076, "dur": 2.513, "args": { "External id": 16630,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650721665.491, "dur": 294.657, "args": { "External id": 16631,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650721667.222, "dur": 0.356, "args": { "External id": 16632,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650721668.601, "dur": 25.989, "args": { "External id": 16633,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650721696.290, "dur": 3.706, "args": { "External id": 16634,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721698.669, "dur": 1.037, "args": { "External id": 16635,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650721700.796, "dur": 27.710, "args": { "External id": 16636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650721702.451, "dur": 1.815, "args": { "External id": 16637,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650721705.670, "dur": 22.433, "args": { "External id": 16638,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650721712.829, "dur": 2.882, "args": { "External id": 16639,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650721730.133, "dur": 23.851, "args": { "External id": 16640,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650721755.686, "dur": 15.349, "args": { "External id": 16641,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650721773.643, "dur": 22.969, "args": { "External id": 16642,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650721798.112, "dur": 42.666, "args": { "External id": 16643,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650721842.370, "dur": 38.716, "args": { "External id": 16644,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650721844.705, "dur": 1.601, "args": { "External id": 16645,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721848.401, "dur": 0.960, "args": { "External id": 16646,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650721884.722, "dur": 35.492, "args": { "External id": 16647,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650721921.351, "dur": 37.762, "args": { "External id": 16648,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650721967.430, "dur": 1.974, "args": { "External id": 16649,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650721978.047, "dur": 38.266, "args": { "External id": 16650,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650721980.257, "dur": 0.343, "args": { "External id": 16651,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650722091.063, "dur": 57.843, "args": { "External id": 16652,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650722153.830, "dur": 8.440, "args": { "External id": 16653,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722159.145, "dur": 1.959, "args": { "External id": 16654,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650722163.420, "dur": 26.857, "args": { "External id": 16655,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650722195.174, "dur": 5.695, "args": { "External id": 16656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650722196.815, "dur": 3.492, "args": { "External id": 16657,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722199.145, "dur": 0.998, "args": { "External id": 16658,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650722203.462, "dur": 64.665, "args": { "External id": 16659,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650722204.738, "dur": 62.193, "args": { "External id": 16660,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650722277.517, "dur": 22.376, "args": { "External id": 16661,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650722308.511, "dur": 5.470, "args": { "External id": 16662,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722311.315, "dur": 1.286, "args": { "External id": 16663,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650722318.481, "dur": 59.393, "args": { "External id": 16664,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650722319.573, "dur": 8.908, "args": { "External id": 16665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650722320.698, "dur": 7.063, "args": { "External id": 16666,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722326.650, "dur": 0.967, "args": { "External id": 16667,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650722329.326, "dur": 48.103, "args": { "External id": 16668,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650722330.291, "dur": 46.514, "args": { "External id": 16669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650722382.168, "dur": 21.485, "args": { "External id": 16670,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722401.204, "dur": 0.979, "args": { "External id": 16671,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650722410.150, "dur": 1.773, "args": { "External id": 16672,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650722422.324, "dur": 7.188, "args": { "External id": 16673,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650722424.362, "dur": 4.873, "args": { "External id": 16674,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650722521.046, "dur": 197.940, "args": { "External id": 16675,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650722525.084, "dur": 2.116, "args": { "External id": 16676,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650722528.840, "dur": 189.543, "args": { "External id": 16677,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650722530.465, "dur": 0.443, "args": { "External id": 16678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650722532.110, "dur": 23.985, "args": { "External id": 16679,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650722559.690, "dur": 5.372, "args": { "External id": 16680,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722563.939, "dur": 0.818, "args": { "External id": 16681,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650722566.170, "dur": 23.393, "args": { "External id": 16682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650722567.403, "dur": 1.741, "args": { "External id": 16683,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650722570.280, "dur": 18.929, "args": { "External id": 16684,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650722573.153, "dur": 2.844, "args": { "External id": 16685,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650722591.095, "dur": 22.680, "args": { "External id": 16686,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650722615.392, "dur": 14.835, "args": { "External id": 16687,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650722633.097, "dur": 14.722, "args": { "External id": 16688,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650722649.210, "dur": 13.138, "args": { "External id": 16689,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650722666.848, "dur": 24.220, "args": { "External id": 16690,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650722671.331, "dur": 1.869, "args": { "External id": 16691,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722675.668, "dur": 0.765, "args": { "External id": 16692,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650722692.460, "dur": 12.984, "args": { "External id": 16693,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650722706.451, "dur": 10.854, "args": { "External id": 16694,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650722725.349, "dur": 1.887, "args": { "External id": 16695,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650722735.335, "dur": 3.622, "args": { "External id": 16696,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722737.783, "dur": 0.354, "args": { "External id": 16697,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650722804.358, "dur": 49.321, "args": { "External id": 16698,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650722858.271, "dur": 4.713, "args": { "External id": 16699,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722860.678, "dur": 1.156, "args": { "External id": 16700,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650722864.384, "dur": 24.914, "args": { "External id": 16701,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650722893.526, "dur": 8.335, "args": { "External id": 16702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650722894.829, "dur": 6.380, "args": { "External id": 16703,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722899.411, "dur": 1.604, "args": { "External id": 16704,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650722904.235, "dur": 40.717, "args": { "External id": 16705,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650722905.195, "dur": 38.972, "args": { "External id": 16706,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650722948.597, "dur": 14.961, "args": { "External id": 16707,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650722968.852, "dur": 3.692, "args": { "External id": 16708,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650722970.719, "dur": 1.003, "args": { "External id": 16709,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650722976.164, "dur": 92.684, "args": { "External id": 16710,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650722979.204, "dur": 40.850, "args": { "External id": 16711,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650722980.012, "dur": 39.093, "args": { "External id": 16712,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723017.780, "dur": 0.922, "args": { "External id": 16713,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650723020.644, "dur": 47.646, "args": { "External id": 16714,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650723021.530, "dur": 46.158, "args": { "External id": 16715,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650723074.195, "dur": 4.533, "args": { "External id": 16716,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723076.367, "dur": 0.829, "args": { "External id": 16717,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650723084.967, "dur": 1.702, "args": { "External id": 16718,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723096.442, "dur": 6.451, "args": { "External id": 16719,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723098.391, "dur": 4.220, "args": { "External id": 16720,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650723185.599, "dur": 244.322, "args": { "External id": 16721,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723189.844, "dur": 2.475, "args": { "External id": 16722,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650723193.989, "dur": 235.317, "args": { "External id": 16723,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650723195.405, "dur": 0.332, "args": { "External id": 16724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650723199.311, "dur": 23.086, "args": { "External id": 16725,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650723244.289, "dur": 8.929, "args": { "External id": 16726,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723250.627, "dur": 1.887, "args": { "External id": 16727,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650723254.802, "dur": 34.182, "args": { "External id": 16728,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723256.445, "dur": 2.898, "args": { "External id": 16729,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650723260.819, "dur": 27.722, "args": { "External id": 16730,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650723265.116, "dur": 3.779, "args": { "External id": 16731,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650723290.822, "dur": 26.528, "args": { "External id": 16732,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650723319.108, "dur": 16.569, "args": { "External id": 16733,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650723338.765, "dur": 17.098, "args": { "External id": 16734,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650723359.858, "dur": 13.641, "args": { "External id": 16735,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650723374.994, "dur": 23.971, "args": { "External id": 16736,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650723377.567, "dur": 1.853, "args": { "External id": 16737,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723381.948, "dur": 1.021, "args": { "External id": 16738,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650723400.295, "dur": 13.161, "args": { "External id": 16739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650723414.392, "dur": 11.393, "args": { "External id": 16740,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650723438.858, "dur": 2.533, "args": { "External id": 16741,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650723451.204, "dur": 3.637, "args": { "External id": 16742,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723453.479, "dur": 0.445, "args": { "External id": 16743,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650723534.390, "dur": 65.530, "args": { "External id": 16744,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650723604.683, "dur": 5.439, "args": { "External id": 16745,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723607.772, "dur": 1.042, "args": { "External id": 16746,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650723611.688, "dur": 27.019, "args": { "External id": 16747,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650723644.096, "dur": 8.029, "args": { "External id": 16748,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650723648.107, "dur": 3.396, "args": { "External id": 16749,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723650.044, "dur": 1.226, "args": { "External id": 16750,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650723655.398, "dur": 41.655, "args": { "External id": 16751,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650723656.514, "dur": 39.890, "args": { "External id": 16752,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650723701.375, "dur": 15.514, "args": { "External id": 16753,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650723722.747, "dur": 6.381, "args": { "External id": 16754,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723727.375, "dur": 0.722, "args": { "External id": 16755,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650723733.195, "dur": 51.293, "args": { "External id": 16756,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650723734.182, "dur": 3.664, "args": { "External id": 16757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650723735.050, "dur": 2.260, "args": { "External id": 16758,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723736.333, "dur": 0.842, "args": { "External id": 16759,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650723738.775, "dur": 45.331, "args": { "External id": 16760,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650723739.668, "dur": 43.878, "args": { "External id": 16761,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650723790.495, "dur": 4.783, "args": { "External id": 16762,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723792.816, "dur": 1.165, "args": { "External id": 16763,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650723800.784, "dur": 1.589, "args": { "External id": 16764,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723810.626, "dur": 8.030, "args": { "External id": 16765,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723812.243, "dur": 6.083, "args": { "External id": 16766,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650723905.712, "dur": 234.833, "args": { "External id": 16767,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723907.760, "dur": 2.210, "args": { "External id": 16768,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650723911.667, "dur": 228.215, "args": { "External id": 16769,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650723913.116, "dur": 0.511, "args": { "External id": 16770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650723914.874, "dur": 25.015, "args": { "External id": 16771,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650723941.530, "dur": 3.753, "args": { "External id": 16772,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650723944.213, "dur": 0.844, "args": { "External id": 16773,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650723946.294, "dur": 26.296, "args": { "External id": 16774,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650723948.112, "dur": 1.782, "args": { "External id": 16775,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650723953.049, "dur": 19.253, "args": { "External id": 16776,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650723957.375, "dur": 2.712, "args": { "External id": 16777,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650723973.840, "dur": 58.985, "args": { "External id": 16778,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650724035.667, "dur": 15.434, "args": { "External id": 16779,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650724054.278, "dur": 15.023, "args": { "External id": 16780,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650724071.309, "dur": 13.999, "args": { "External id": 16781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650724087.560, "dur": 24.378, "args": { "External id": 16782,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650724089.751, "dur": 2.026, "args": { "External id": 16783,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724095.581, "dur": 0.817, "args": { "External id": 16784,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650724113.226, "dur": 12.920, "args": { "External id": 16785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650724127.417, "dur": 11.278, "args": { "External id": 16786,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650724148.844, "dur": 2.661, "args": { "External id": 16787,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650724161.248, "dur": 3.769, "args": { "External id": 16788,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724163.899, "dur": 0.441, "args": { "External id": 16789,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650724250.018, "dur": 67.803, "args": { "External id": 16790,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650724324.031, "dur": 9.495, "args": { "External id": 16791,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724329.687, "dur": 2.243, "args": { "External id": 16792,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650724335.139, "dur": 29.094, "args": { "External id": 16793,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650724370.215, "dur": 5.865, "args": { "External id": 16794,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650724371.901, "dur": 3.447, "args": { "External id": 16795,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724373.838, "dur": 1.336, "args": { "External id": 16796,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650724379.054, "dur": 42.957, "args": { "External id": 16797,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650724380.497, "dur": 40.946, "args": { "External id": 16798,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650724428.709, "dur": 15.750, "args": { "External id": 16799,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650724450.897, "dur": 4.363, "args": { "External id": 16800,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724453.508, "dur": 0.779, "args": { "External id": 16801,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650724459.394, "dur": 50.237, "args": { "External id": 16802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650724460.153, "dur": 7.173, "args": { "External id": 16803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650724460.886, "dur": 5.855, "args": { "External id": 16804,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724464.040, "dur": 2.485, "args": { "External id": 16805,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650724468.030, "dur": 41.241, "args": { "External id": 16806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650724469.030, "dur": 39.651, "args": { "External id": 16807,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650724513.673, "dur": 4.390, "args": { "External id": 16808,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724516.005, "dur": 0.882, "args": { "External id": 16809,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650724524.223, "dur": 1.795, "args": { "External id": 16810,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650724534.492, "dur": 9.033, "args": { "External id": 16811,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650724538.408, "dur": 4.850, "args": { "External id": 16812,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650724627.677, "dur": 193.193, "args": { "External id": 16813,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650724630.168, "dur": 2.021, "args": { "External id": 16814,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650724634.013, "dur": 186.395, "args": { "External id": 16815,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650724635.380, "dur": 0.624, "args": { "External id": 16816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650724639.957, "dur": 22.680, "args": { "External id": 16817,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650724664.524, "dur": 3.767, "args": { "External id": 16818,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724666.942, "dur": 1.053, "args": { "External id": 16819,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650724669.150, "dur": 27.735, "args": { "External id": 16820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650724670.740, "dur": 3.473, "args": { "External id": 16821,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650724677.955, "dur": 18.568, "args": { "External id": 16822,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650724680.274, "dur": 3.050, "args": { "External id": 16823,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650724698.201, "dur": 21.771, "args": { "External id": 16824,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650724721.816, "dur": 13.503, "args": { "External id": 16825,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650724737.526, "dur": 16.269, "args": { "External id": 16826,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650724755.029, "dur": 13.459, "args": { "External id": 16827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650724770.142, "dur": 22.079, "args": { "External id": 16828,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650724772.094, "dur": 1.647, "args": { "External id": 16829,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724777.569, "dur": 0.739, "args": { "External id": 16830,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650724793.553, "dur": 12.880, "args": { "External id": 16831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650724807.502, "dur": 11.884, "args": { "External id": 16832,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650724827.617, "dur": 2.025, "args": { "External id": 16833,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650724837.581, "dur": 3.330, "args": { "External id": 16834,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724839.725, "dur": 0.444, "args": { "External id": 16835,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650724898.695, "dur": 47.019, "args": { "External id": 16836,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650724950.156, "dur": 6.769, "args": { "External id": 16837,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650724954.773, "dur": 1.163, "args": { "External id": 16838,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650724958.406, "dur": 22.973, "args": { "External id": 16839,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650725023.627, "dur": 8.346, "args": { "External id": 16840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650725025.023, "dur": 5.927, "args": { "External id": 16841,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725027.062, "dur": 3.462, "args": { "External id": 16842,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650725035.181, "dur": 50.896, "args": { "External id": 16843,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650725038.341, "dur": 46.944, "args": { "External id": 16844,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650725090.885, "dur": 20.836, "args": { "External id": 16845,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650725118.057, "dur": 4.446, "args": { "External id": 16846,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725120.450, "dur": 1.053, "args": { "External id": 16847,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336757, "tid": 1336757, "ts": 1295650725126.456, "dur": 50.991, "args": { "External id": 16848,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650725127.328, "dur": 6.262, "args": { "External id": 16849,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650725128.388, "dur": 4.695, "args": { "External id": 16850,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725131.746, "dur": 1.192, "args": { "External id": 16851,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650725134.190, "dur": 42.813, "args": { "External id": 16852,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650725135.063, "dur": 41.367, "args": { "External id": 16853,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650725181.411, "dur": 4.697, "args": { "External id": 16854,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725183.953, "dur": 0.921, "args": { "External id": 16855,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650725192.200, "dur": 1.712, "args": { "External id": 16856,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336757, "tid": 1336757, "ts": 1295650725203.545, "dur": 6.491, "args": { "External id": 16857,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650725205.480, "dur": 4.273, "args": { "External id": 16858,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650725333.491, "dur": 204.414, "args": { "External id": 16859,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650725336.078, "dur": 3.712, "args": { "External id": 16860,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336757, "tid": 1336757, "ts": 1295650725344.306, "dur": 193.114, "args": { "External id": 16861,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336757, "tid": 1336757, "ts": 1295650725345.848, "dur": 0.544, "args": { "External id": 16862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336757, "tid": 1336757, "ts": 1295650725349.968, "dur": 27.930, "args": { "External id": 16863,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336757, "tid": 1336757, "ts": 1295650725379.265, "dur": 5.915, "args": { "External id": 16864,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725381.550, "dur": 3.173, "args": { "External id": 16865,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650725386.257, "dur": 22.916, "args": { "External id": 16866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295650725387.837, "dur": 2.024, "args": { "External id": 16867,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295650725390.967, "dur": 17.934, "args": { "External id": 16868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650725393.605, "dur": 2.941, "args": { "External id": 16869,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295650725410.920, "dur": 22.584, "args": { "External id": 16870,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650725435.109, "dur": 15.292, "args": { "External id": 16871,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336757, "tid": 1336757, "ts": 1295650725453.518, "dur": 14.278, "args": { "External id": 16872,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336757, "tid": 1336757, "ts": 1295650725471.803, "dur": 14.335, "args": { "External id": 16873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650725487.724, "dur": 21.879, "args": { "External id": 16874,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295650725489.965, "dur": 1.906, "args": { "External id": 16875,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725493.760, "dur": 1.134, "args": { "External id": 16876,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336757, "tid": 1336757, "ts": 1295650725511.224, "dur": 13.334, "args": { "External id": 16877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650725525.800, "dur": 10.549, "args": { "External id": 16878,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295650725547.006, "dur": 2.002, "args": { "External id": 16879,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650725558.189, "dur": 3.902, "args": { "External id": 16880,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725560.695, "dur": 0.560, "args": { "External id": 16881,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650725627.945, "dur": 56.596, "args": { "External id": 16882,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336757, "tid": 1336757, "ts": 1295650725689.672, "dur": 6.930, "args": { "External id": 16883,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725692.568, "dur": 2.836, "args": { "External id": 16884,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650725698.014, "dur": 25.640, "args": { "External id": 16885,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336757, "tid": 1336757, "ts": 1295650725728.673, "dur": 7.968, "args": { "External id": 16886,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336757, "tid": 1336757, "ts": 1295650725730.044, "dur": 5.982, "args": { "External id": 16887,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725734.180, "dur": 1.619, "args": { "External id": 16888,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336757, "tid": 1336757, "ts": 1295650725739.749, "dur": 39.610, "args": { "External id": 16889,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336757, "tid": 1336757, "ts": 1295650725740.771, "dur": 37.995, "args": { "External id": 16890,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650725783.869, "dur": 15.161, "args": { "External id": 16891,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650725804.071, "dur": 25.128, "args": { "External id": 16892,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336757, "tid": 1336757, "ts": 1295650725806.525, "dur": 22.300, "args": { "External id": 16893,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725811.721, "dur": 0.915, "args": { "External id": 16894,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295650725835.269, "dur": 75.479, "args": { "External id": 16895,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336757, "tid": 1336757, "ts": 1295650725837.162, "dur": 73.376, "args": { "External id": 16896,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 10391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650725888.878, "dur": 4.940, "args": { "External id": 16897,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295650725895.026, "dur": 15.037, "args": { "External id": 16898,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650725923.243, "dur": 5.306, "args": { "External id": 16899,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 10394 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650725925.291, "dur": 2.942, "args": { "External id": 16900,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 10395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336757, "tid": 1336757, "ts": 1295650725929.532, "dur": 0.847, "args": { "External id": 16901,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10396 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336757, "tid": 1336757, "ts": 1295650725929.866, "dur": 0.438, "args": { "External id": 16902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650725972.297, "dur": 63.506, "args": { "External id": 16903,"Sequence number": 246768, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336757, "tid": 1336757, "ts": 1295650726039.447, "dur": 17.159, "args": { "External id": 16904,"Sequence number": 246769, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10399 } }, { "ph": "s", "id": 2, "pid": 1336757, "tid": 1336757, "ts": 1295650726039.447, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward", "pid": 1336757, "tid": 1336757, "ts": 1295650726164.709, "dur": 39.710, "args": { "External id": 16905,"Record function id": 0, "Ev Idx": 10400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336757, "tid": 1336757, "ts": 1295650726346.985, "dur": 42.662, "args": { "External id": 16906,"Sequence number": 246770, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10401 } }, { "ph": "s", "id": 1, "pid": 1336757, "tid": 1336757, "ts": 1295650726346.985, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::ones_like", "pid": 1336757, "tid": 1336757, "ts": 1295650726449.631, "dur": 28.541, "args": { "External id": 16907,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 10402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295650726451.277, "dur": 9.805, "args": { "External id": 16908,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 10403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336757, "tid": 1336757, "ts": 1295650726456.584, "dur": 3.843, "args": { "External id": 16909,"Record function id": 0, "Concrete Inputs": ["[1]", "[1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295650726462.498, "dur": 15.389, "args": { "External id": 16910,"Record function id": 0, "Concrete Inputs": ["", "1."], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336757, "tid": 1336757, "ts": 1295652033267.569, "dur": 87.790, "args": { "External id": 16911,"Sequence number": 246771, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336757, "tid": 1336757, "ts": 1295652033369.132, "dur": 27.936, "args": { "External id": 16912,"Sequence number": 246772, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295652033405.714, "dur": 24.203, "args": { "External id": 16913,"Sequence number": 246773, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295652033957.437, "dur": 23.701, "args": { "External id": 16914,"Sequence number": 246774, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295652034428.849, "dur": 46.835, "args": { "External id": 16915,"Sequence number": 246775, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 1336757, "tid": 1336757, "ts": 1295652036024.529, "dur": 3316.358, "args": { "External id": 16916,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 1336757, "tid": 1336757, "ts": 1295652036629.596, "dur": 1082.146, "args": { "External id": 16917,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336757, "tid": 1336757, "ts": 1295652036649.087, "dur": 65.722, "args": { "External id": 16918,"Record function id": 0, "Concrete Inputs": ["[36375]", "6", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 10413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295652036652.395, "dur": 12.275, "args": { "External id": 16919,"Record function id": 0, "Concrete Inputs": ["[36375]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336757, "tid": 1336757, "ts": 1295652036667.931, "dur": 46.544, "args": { "External id": 16920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[36375]], "Ev Idx": 10415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336757, "tid": 1336757, "ts": 1295652036669.999, "dur": 43.888, "args": { "External id": 16921,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[36375], []], "Ev Idx": 10416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039379.990, "dur": 3.187, "args": { "External id": 16922,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039385.344, "dur": 0.324, "args": { "External id": 16923,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039386.951, "dur": 0.410, "args": { "External id": 16924,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039388.711, "dur": 0.413, "args": { "External id": 16925,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039390.394, "dur": 0.426, "args": { "External id": 16926,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039392.135, "dur": 0.397, "args": { "External id": 16927,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039393.745, "dur": 0.345, "args": { "External id": 16928,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039397.450, "dur": 0.374, "args": { "External id": 16929,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039398.852, "dur": 0.334, "args": { "External id": 16930,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039400.369, "dur": 0.176, "args": { "External id": 16931,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039401.355, "dur": 0.401, "args": { "External id": 16932,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039403.027, "dur": 0.426, "args": { "External id": 16933,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039404.179, "dur": 0.385, "args": { "External id": 16934,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039405.734, "dur": 0.322, "args": { "External id": 16935,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039406.805, "dur": 0.199, "args": { "External id": 16936,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039409.916, "dur": 0.211, "args": { "External id": 16937,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039410.843, "dur": 0.414, "args": { "External id": 16938,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039412.326, "dur": 0.199, "args": { "External id": 16939,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039413.231, "dur": 0.415, "args": { "External id": 16940,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039414.395, "dur": 0.440, "args": { "External id": 16941,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039415.868, "dur": 0.448, "args": { "External id": 16942,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039417.249, "dur": 0.472, "args": { "External id": 16943,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039418.429, "dur": 0.427, "args": { "External id": 16944,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039421.796, "dur": 0.209, "args": { "External id": 16945,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039422.729, "dur": 0.411, "args": { "External id": 16946,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039424.217, "dur": 0.212, "args": { "External id": 16947,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039425.490, "dur": 0.206, "args": { "External id": 16948,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039426.646, "dur": 0.222, "args": { "External id": 16949,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039427.885, "dur": 0.210, "args": { "External id": 16950,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039428.803, "dur": 0.199, "args": { "External id": 16951,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039429.875, "dur": 0.204, "args": { "External id": 16952,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039433.219, "dur": 0.213, "args": { "External id": 16953,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039434.298, "dur": 0.205, "args": { "External id": 16954,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039435.850, "dur": 0.200, "args": { "External id": 16955,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039436.944, "dur": 0.209, "args": { "External id": 16956,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039437.872, "dur": 0.201, "args": { "External id": 16957,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039439.003, "dur": 0.224, "args": { "External id": 16958,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039439.970, "dur": 0.210, "args": { "External id": 16959,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039440.894, "dur": 0.218, "args": { "External id": 16960,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039443.681, "dur": 0.207, "args": { "External id": 16961,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039444.938, "dur": 0.209, "args": { "External id": 16962,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039446.328, "dur": 0.202, "args": { "External id": 16963,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039447.465, "dur": 0.204, "args": { "External id": 16964,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039448.573, "dur": 0.439, "args": { "External id": 16965,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039450.115, "dur": 0.414, "args": { "External id": 16966,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039452.876, "dur": 0.496, "args": { "External id": 16967,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039454.120, "dur": 0.422, "args": { "External id": 16968,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039457.452, "dur": 0.204, "args": { "External id": 16969,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039458.591, "dur": 0.203, "args": { "External id": 16970,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039459.547, "dur": 0.411, "args": { "External id": 16971,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039460.654, "dur": 0.411, "args": { "External id": 16972,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039461.765, "dur": 0.195, "args": { "External id": 16973,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039462.899, "dur": 0.200, "args": { "External id": 16974,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039464.408, "dur": 0.199, "args": { "External id": 16975,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039465.319, "dur": 0.199, "args": { "External id": 16976,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039468.258, "dur": 0.199, "args": { "External id": 16977,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039469.377, "dur": 0.209, "args": { "External id": 16978,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039470.474, "dur": 0.196, "args": { "External id": 16979,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039471.376, "dur": 0.203, "args": { "External id": 16980,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039472.279, "dur": 0.207, "args": { "External id": 16981,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039473.219, "dur": 0.201, "args": { "External id": 16982,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039474.149, "dur": 0.200, "args": { "External id": 16983,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039475.269, "dur": 0.596, "args": { "External id": 16984,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039478.899, "dur": 0.195, "args": { "External id": 16985,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039479.790, "dur": 0.382, "args": { "External id": 16986,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039481.349, "dur": 0.394, "args": { "External id": 16987,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039482.497, "dur": 0.383, "args": { "External id": 16988,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039483.712, "dur": 0.364, "args": { "External id": 16989,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039485.088, "dur": 0.392, "args": { "External id": 16990,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039486.254, "dur": 0.407, "args": { "External id": 16991,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039487.357, "dur": 0.399, "args": { "External id": 16992,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039490.413, "dur": 0.363, "args": { "External id": 16993,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039491.652, "dur": 0.404, "args": { "External id": 16994,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039492.769, "dur": 0.196, "args": { "External id": 16995,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039493.656, "dur": 0.221, "args": { "External id": 16996,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039494.987, "dur": 0.223, "args": { "External id": 16997,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039496.151, "dur": 0.205, "args": { "External id": 16998,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039497.960, "dur": 0.215, "args": { "External id": 16999,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039499.109, "dur": 0.198, "args": { "External id": 17000,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039502.249, "dur": 0.199, "args": { "External id": 17001,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039503.146, "dur": 0.200, "args": { "External id": 17002,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039504.078, "dur": 0.197, "args": { "External id": 17003,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039504.967, "dur": 0.197, "args": { "External id": 17004,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039506.044, "dur": 0.202, "args": { "External id": 17005,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039507.061, "dur": 0.196, "args": { "External id": 17006,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039508.083, "dur": 0.201, "args": { "External id": 17007,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039509.049, "dur": 0.203, "args": { "External id": 17008,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039512.202, "dur": 0.205, "args": { "External id": 17009,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039513.097, "dur": 0.413, "args": { "External id": 17010,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039514.205, "dur": 0.439, "args": { "External id": 17011,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039515.388, "dur": 0.364, "args": { "External id": 17012,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039516.475, "dur": 0.207, "args": { "External id": 17013,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039517.426, "dur": 0.432, "args": { "External id": 17014,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039519.163, "dur": 0.407, "args": { "External id": 17015,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039520.333, "dur": 0.384, "args": { "External id": 17016,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039523.634, "dur": 0.204, "args": { "External id": 17017,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039524.587, "dur": 0.411, "args": { "External id": 17018,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039525.717, "dur": 0.439, "args": { "External id": 17019,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039526.857, "dur": 0.409, "args": { "External id": 17020,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039527.998, "dur": 0.206, "args": { "External id": 17021,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039528.907, "dur": 0.197, "args": { "External id": 17022,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039529.809, "dur": 0.367, "args": { "External id": 17023,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039530.915, "dur": 0.398, "args": { "External id": 17024,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039534.376, "dur": 0.413, "args": { "External id": 17025,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039535.509, "dur": 0.365, "args": { "External id": 17026,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039536.569, "dur": 0.202, "args": { "External id": 17027,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039537.476, "dur": 0.351, "args": { "External id": 17028,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039538.548, "dur": 0.346, "args": { "External id": 17029,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039539.766, "dur": 0.341, "args": { "External id": 17030,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039541.465, "dur": 0.244, "args": { "External id": 17031,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039542.559, "dur": 0.218, "args": { "External id": 17032,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039545.673, "dur": 0.204, "args": { "External id": 17033,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039546.598, "dur": 0.196, "args": { "External id": 17034,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039547.509, "dur": 0.197, "args": { "External id": 17035,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039548.422, "dur": 0.198, "args": { "External id": 17036,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039549.315, "dur": 0.200, "args": { "External id": 17037,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039550.609, "dur": 0.198, "args": { "External id": 17038,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039551.538, "dur": 0.197, "args": { "External id": 17039,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039552.427, "dur": 0.221, "args": { "External id": 17040,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039555.158, "dur": 0.196, "args": { "External id": 17041,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039556.103, "dur": 0.199, "args": { "External id": 17042,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039557.001, "dur": 0.201, "args": { "External id": 17043,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039557.924, "dur": 0.197, "args": { "External id": 17044,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039559.008, "dur": 0.197, "args": { "External id": 17045,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039560.118, "dur": 0.200, "args": { "External id": 17046,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039561.132, "dur": 0.198, "args": { "External id": 17047,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039562.035, "dur": 0.199, "args": { "External id": 17048,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039564.964, "dur": 0.203, "args": { "External id": 17049,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039565.875, "dur": 0.202, "args": { "External id": 17050,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039567.187, "dur": 0.210, "args": { "External id": 17051,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039568.135, "dur": 0.203, "args": { "External id": 17052,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039569.151, "dur": 0.204, "args": { "External id": 17053,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039570.092, "dur": 0.200, "args": { "External id": 17054,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039571.004, "dur": 0.203, "args": { "External id": 17055,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039571.924, "dur": 0.200, "args": { "External id": 17056,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039574.842, "dur": 0.225, "args": { "External id": 17057,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039575.927, "dur": 0.198, "args": { "External id": 17058,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039576.822, "dur": 0.202, "args": { "External id": 17059,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039577.747, "dur": 0.199, "args": { "External id": 17060,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039578.669, "dur": 0.202, "args": { "External id": 17061,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039579.567, "dur": 0.201, "args": { "External id": 17062,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039580.482, "dur": 0.198, "args": { "External id": 17063,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039581.550, "dur": 0.201, "args": { "External id": 17064,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039584.733, "dur": 0.208, "args": { "External id": 17065,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039585.683, "dur": 0.198, "args": { "External id": 17066,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039586.620, "dur": 0.413, "args": { "External id": 17067,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039588.232, "dur": 0.170, "args": { "External id": 17068,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039589.098, "dur": 0.375, "args": { "External id": 17069,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039590.365, "dur": 0.472, "args": { "External id": 17070,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039591.938, "dur": 0.461, "args": { "External id": 17071,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039593.105, "dur": 0.383, "args": { "External id": 17072,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039596.259, "dur": 0.203, "args": { "External id": 17073,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039597.323, "dur": 0.365, "args": { "External id": 17074,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039598.386, "dur": 0.377, "args": { "External id": 17075,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039599.464, "dur": 0.404, "args": { "External id": 17076,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039600.579, "dur": 0.202, "args": { "External id": 17077,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039601.701, "dur": 0.196, "args": { "External id": 17078,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039602.824, "dur": 0.227, "args": { "External id": 17079,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039603.780, "dur": 0.202, "args": { "External id": 17080,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039608.252, "dur": 0.208, "args": { "External id": 17081,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039609.184, "dur": 0.198, "args": { "External id": 17082,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039610.225, "dur": 0.400, "args": { "External id": 17083,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039611.557, "dur": 0.412, "args": { "External id": 17084,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039612.742, "dur": 0.402, "args": { "External id": 17085,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039613.862, "dur": 0.376, "args": { "External id": 17086,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039615.018, "dur": 0.410, "args": { "External id": 17087,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039616.122, "dur": 0.576, "args": { "External id": 17088,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039619.480, "dur": 0.202, "args": { "External id": 17089,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039620.393, "dur": 0.526, "args": { "External id": 17090,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039621.827, "dur": 0.409, "args": { "External id": 17091,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039622.984, "dur": 0.368, "args": { "External id": 17092,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039624.281, "dur": 0.203, "args": { "External id": 17093,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039625.180, "dur": 0.199, "args": { "External id": 17094,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039626.590, "dur": 0.208, "args": { "External id": 17095,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039627.491, "dur": 0.206, "args": { "External id": 17096,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039630.555, "dur": 0.197, "args": { "External id": 17097,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039631.480, "dur": 0.200, "args": { "External id": 17098,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039632.385, "dur": 0.205, "args": { "External id": 17099,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039633.313, "dur": 0.198, "args": { "External id": 17100,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039634.213, "dur": 0.203, "args": { "External id": 17101,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039635.124, "dur": 0.206, "args": { "External id": 17102,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039636.277, "dur": 0.199, "args": { "External id": 17103,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039637.183, "dur": 0.222, "args": { "External id": 17104,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039640.082, "dur": 0.202, "args": { "External id": 17105,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039640.979, "dur": 0.201, "args": { "External id": 17106,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039641.875, "dur": 0.233, "args": { "External id": 17107,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039642.796, "dur": 0.204, "args": { "External id": 17108,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039643.696, "dur": 0.206, "args": { "External id": 17109,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039644.596, "dur": 0.199, "args": { "External id": 17110,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039645.490, "dur": 0.200, "args": { "External id": 17111,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039646.417, "dur": 0.204, "args": { "External id": 17112,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039649.411, "dur": 0.199, "args": { "External id": 17113,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039650.499, "dur": 0.201, "args": { "External id": 17114,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039651.406, "dur": 0.202, "args": { "External id": 17115,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039652.315, "dur": 0.195, "args": { "External id": 17116,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039653.212, "dur": 0.201, "args": { "External id": 17117,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039654.307, "dur": 0.229, "args": { "External id": 17118,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039655.328, "dur": 0.201, "args": { "External id": 17119,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039656.269, "dur": 0.252, "args": { "External id": 17120,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039659.115, "dur": 0.200, "args": { "External id": 17121,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039660.039, "dur": 0.200, "args": { "External id": 17122,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039661.359, "dur": 0.204, "args": { "External id": 17123,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039662.308, "dur": 0.200, "args": { "External id": 17124,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039663.247, "dur": 0.206, "args": { "External id": 17125,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039664.150, "dur": 0.198, "args": { "External id": 17126,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039665.106, "dur": 0.221, "args": { "External id": 17127,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039666.076, "dur": 0.201, "args": { "External id": 17128,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039668.947, "dur": 0.204, "args": { "External id": 17129,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039669.850, "dur": 0.200, "args": { "External id": 17130,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039670.855, "dur": 0.200, "args": { "External id": 17131,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039671.938, "dur": 0.195, "args": { "External id": 17132,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039673.012, "dur": 0.200, "args": { "External id": 17133,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039674.087, "dur": 0.223, "args": { "External id": 17134,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039675.161, "dur": 0.373, "args": { "External id": 17135,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039676.255, "dur": 0.348, "args": { "External id": 17136,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039679.274, "dur": 0.205, "args": { "External id": 17137,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039680.170, "dur": 0.200, "args": { "External id": 17138,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039681.259, "dur": 0.414, "args": { "External id": 17139,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039682.399, "dur": 0.407, "args": { "External id": 17140,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039683.496, "dur": 0.410, "args": { "External id": 17141,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039684.652, "dur": 0.387, "args": { "External id": 17142,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039685.754, "dur": 0.449, "args": { "External id": 17143,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039686.954, "dur": 0.405, "args": { "External id": 17144,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039690.190, "dur": 0.198, "args": { "External id": 17145,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039691.134, "dur": 0.376, "args": { "External id": 17146,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039692.214, "dur": 0.416, "args": { "External id": 17147,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039693.335, "dur": 0.402, "args": { "External id": 17148,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039694.612, "dur": 0.199, "args": { "External id": 17149,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039695.537, "dur": 0.203, "args": { "External id": 17150,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039696.466, "dur": 0.202, "args": { "External id": 17151,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039697.436, "dur": 0.201, "args": { "External id": 17152,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039700.712, "dur": 0.201, "args": { "External id": 17153,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039701.607, "dur": 0.223, "args": { "External id": 17154,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039702.879, "dur": 0.200, "args": { "External id": 17155,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039703.793, "dur": 0.467, "args": { "External id": 17156,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039704.950, "dur": 0.390, "args": { "External id": 17157,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039706.043, "dur": 0.402, "args": { "External id": 17158,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039707.169, "dur": 0.400, "args": { "External id": 17159,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039708.295, "dur": 0.429, "args": { "External id": 17160,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039711.446, "dur": 0.204, "args": { "External id": 17161,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039712.334, "dur": 0.558, "args": { "External id": 17162,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039713.603, "dur": 0.371, "args": { "External id": 17163,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039714.915, "dur": 0.161, "args": { "External id": 17164,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039715.764, "dur": 0.398, "args": { "External id": 17165,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039716.845, "dur": 0.200, "args": { "External id": 17166,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039717.769, "dur": 0.218, "args": { "External id": 17167,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039718.758, "dur": 0.196, "args": { "External id": 17168,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039721.506, "dur": 0.206, "args": { "External id": 17169,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039722.457, "dur": 0.200, "args": { "External id": 17170,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039723.369, "dur": 0.198, "args": { "External id": 17171,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039724.333, "dur": 0.210, "args": { "External id": 17172,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039725.291, "dur": 0.196, "args": { "External id": 17173,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039726.498, "dur": 0.199, "args": { "External id": 17174,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039727.617, "dur": 0.203, "args": { "External id": 17175,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039728.545, "dur": 0.199, "args": { "External id": 17176,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039731.490, "dur": 0.196, "args": { "External id": 17177,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039737.721, "dur": 0.207, "args": { "External id": 17178,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039738.895, "dur": 0.219, "args": { "External id": 17179,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039740.032, "dur": 0.196, "args": { "External id": 17180,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039740.931, "dur": 0.197, "args": { "External id": 17181,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039741.997, "dur": 0.201, "args": { "External id": 17182,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039742.983, "dur": 0.198, "args": { "External id": 17183,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039743.866, "dur": 0.197, "args": { "External id": 17184,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039746.759, "dur": 0.238, "args": { "External id": 17185,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039747.706, "dur": 0.202, "args": { "External id": 17186,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039748.677, "dur": 0.217, "args": { "External id": 17187,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039749.583, "dur": 0.202, "args": { "External id": 17188,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039750.497, "dur": 0.203, "args": { "External id": 17189,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039751.629, "dur": 0.274, "args": { "External id": 17190,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039752.858, "dur": 0.209, "args": { "External id": 17191,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039753.773, "dur": 0.204, "args": { "External id": 17192,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039756.396, "dur": 0.204, "args": { "External id": 17193,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039757.319, "dur": 0.218, "args": { "External id": 17194,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039759.668, "dur": 0.206, "args": { "External id": 17195,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039760.594, "dur": 0.199, "args": { "External id": 17196,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039761.560, "dur": 0.196, "args": { "External id": 17197,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039762.453, "dur": 0.203, "args": { "External id": 17198,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039763.355, "dur": 0.197, "args": { "External id": 17199,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039764.281, "dur": 0.197, "args": { "External id": 17200,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039767.629, "dur": 0.200, "args": { "External id": 17201,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039768.556, "dur": 0.201, "args": { "External id": 17202,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039769.456, "dur": 0.201, "args": { "External id": 17203,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039770.358, "dur": 0.201, "args": { "External id": 17204,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039771.302, "dur": 0.194, "args": { "External id": 17205,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039772.219, "dur": 0.199, "args": { "External id": 17206,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039773.109, "dur": 0.225, "args": { "External id": 17207,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039774.056, "dur": 0.272, "args": { "External id": 17208,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039777.051, "dur": 0.320, "args": { "External id": 17209,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039778.146, "dur": 0.205, "args": { "External id": 17210,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039779.049, "dur": 0.406, "args": { "External id": 17211,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652039780.172, "dur": 0.197, "args": { "External id": 17212,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336757, "tid": 1336757, "ts": 1295652039836.645, "dur": 1630.814, "args": { "External id": 17213,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336757, "tid": 1336757, "ts": 1295652040356.153, "dur": 1023.595, "args": { "External id": 17214,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040365.046, "dur": 8.925, "args": { "External id": 17215,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040369.447, "dur": 3.727, "args": { "External id": 17216,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040374.643, "dur": 3.995, "args": { "External id": 17217,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040375.808, "dur": 2.503, "args": { "External id": 17218,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040379.243, "dur": 3.229, "args": { "External id": 17219,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040381.421, "dur": 0.953, "args": { "External id": 17220,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040383.008, "dur": 1.459, "args": { "External id": 17221,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040383.863, "dur": 0.526, "args": { "External id": 17222,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040386.731, "dur": 4.483, "args": { "External id": 17223,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040390.807, "dur": 0.329, "args": { "External id": 17224,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040391.500, "dur": 1.176, "args": { "External id": 17225,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040391.935, "dur": 0.668, "args": { "External id": 17226,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040393.228, "dur": 1.225, "args": { "External id": 17227,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040393.599, "dur": 0.778, "args": { "External id": 17228,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040395.083, "dur": 3.097, "args": { "External id": 17229,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040397.556, "dur": 0.548, "args": { "External id": 17230,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040398.614, "dur": 1.382, "args": { "External id": 17231,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040399.201, "dur": 0.717, "args": { "External id": 17232,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040400.414, "dur": 2.722, "args": { "External id": 17233,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040400.804, "dur": 2.259, "args": { "External id": 17234,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040403.381, "dur": 2.609, "args": { "External id": 17235,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040405.322, "dur": 0.604, "args": { "External id": 17236,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040406.485, "dur": 1.568, "args": { "External id": 17237,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040406.832, "dur": 1.142, "args": { "External id": 17238,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040410.465, "dur": 4.856, "args": { "External id": 17239,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040414.692, "dur": 0.556, "args": { "External id": 17240,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040415.782, "dur": 1.245, "args": { "External id": 17241,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040416.278, "dur": 0.676, "args": { "External id": 17242,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040417.679, "dur": 0.892, "args": { "External id": 17243,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040418.076, "dur": 0.418, "args": { "External id": 17244,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040419.226, "dur": 3.063, "args": { "External id": 17245,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040421.987, "dur": 0.225, "args": { "External id": 17246,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040422.813, "dur": 1.061, "args": { "External id": 17247,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040423.183, "dur": 0.622, "args": { "External id": 17248,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040424.290, "dur": 2.615, "args": { "External id": 17249,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040424.665, "dur": 2.163, "args": { "External id": 17250,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040427.196, "dur": 1.743, "args": { "External id": 17251,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040428.485, "dur": 0.374, "args": { "External id": 17252,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040429.181, "dur": 0.704, "args": { "External id": 17253,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040429.546, "dur": 0.265, "args": { "External id": 17254,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040432.246, "dur": 4.650, "args": { "External id": 17255,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040436.418, "dur": 0.405, "args": { "External id": 17256,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040437.337, "dur": 1.089, "args": { "External id": 17257,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040437.740, "dur": 0.618, "args": { "External id": 17258,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040438.986, "dur": 1.261, "args": { "External id": 17259,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040439.353, "dur": 0.816, "args": { "External id": 17260,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040440.745, "dur": 4.632, "args": { "External id": 17261,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040444.786, "dur": 0.525, "args": { "External id": 17262,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040446.011, "dur": 0.814, "args": { "External id": 17263,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040446.533, "dur": 0.213, "args": { "External id": 17264,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040447.243, "dur": 3.039, "args": { "External id": 17265,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040447.655, "dur": 2.544, "args": { "External id": 17266,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040450.746, "dur": 2.301, "args": { "External id": 17267,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040452.620, "dur": 0.351, "args": { "External id": 17268,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040453.272, "dur": 0.941, "args": { "External id": 17269,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040453.618, "dur": 0.525, "args": { "External id": 17270,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040456.903, "dur": 4.968, "args": { "External id": 17271,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040461.257, "dur": 0.543, "args": { "External id": 17272,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040462.309, "dur": 1.440, "args": { "External id": 17273,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040462.802, "dur": 0.874, "args": { "External id": 17274,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040464.192, "dur": 1.433, "args": { "External id": 17275,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040464.733, "dur": 0.824, "args": { "External id": 17276,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040466.104, "dur": 3.332, "args": { "External id": 17277,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040468.922, "dur": 0.445, "args": { "External id": 17278,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040469.994, "dur": 0.823, "args": { "External id": 17279,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040470.347, "dur": 0.405, "args": { "External id": 17280,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040471.238, "dur": 2.802, "args": { "External id": 17281,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040471.591, "dur": 2.205, "args": { "External id": 17282,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040474.347, "dur": 3.691, "args": { "External id": 17283,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040477.582, "dur": 0.391, "args": { "External id": 17284,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040478.463, "dur": 2.664, "args": { "External id": 17285,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040478.824, "dur": 2.225, "args": { "External id": 17286,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040483.473, "dur": 2.726, "args": { "External id": 17287,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040485.517, "dur": 0.608, "args": { "External id": 17288,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040486.587, "dur": 1.644, "args": { "External id": 17289,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040487.131, "dur": 1.029, "args": { "External id": 17290,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040488.461, "dur": 3.058, "args": { "External id": 17291,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040491.102, "dur": 0.345, "args": { "External id": 17292,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040491.762, "dur": 2.449, "args": { "External id": 17293,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040493.442, "dur": 0.700, "args": { "External id": 17294,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040494.599, "dur": 1.068, "args": { "External id": 17295,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040495.124, "dur": 0.471, "args": { "External id": 17296,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040496.056, "dur": 2.954, "args": { "External id": 17297,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040498.355, "dur": 0.586, "args": { "External id": 17298,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040499.248, "dur": 1.348, "args": { "External id": 17299,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040499.908, "dur": 0.620, "args": { "External id": 17300,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040500.821, "dur": 2.573, "args": { "External id": 17301,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040501.296, "dur": 2.020, "args": { "External id": 17302,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040506.101, "dur": 1.700, "args": { "External id": 17303,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040507.013, "dur": 0.722, "args": { "External id": 17304,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040508.207, "dur": 1.037, "args": { "External id": 17305,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040508.695, "dur": 0.476, "args": { "External id": 17306,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040509.636, "dur": 2.663, "args": { "External id": 17307,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040512.021, "dur": 0.203, "args": { "External id": 17308,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040512.749, "dur": 1.311, "args": { "External id": 17309,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040513.588, "dur": 0.403, "args": { "External id": 17310,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040514.321, "dur": 1.443, "args": { "External id": 17311,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040514.840, "dur": 0.854, "args": { "External id": 17312,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040516.034, "dur": 3.024, "args": { "External id": 17313,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040518.586, "dur": 0.402, "args": { "External id": 17314,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040519.284, "dur": 1.206, "args": { "External id": 17315,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040519.935, "dur": 0.491, "args": { "External id": 17316,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040520.906, "dur": 3.244, "args": { "External id": 17317,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040521.528, "dur": 2.292, "args": { "External id": 17318,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040526.420, "dur": 1.320, "args": { "External id": 17319,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040527.075, "dur": 0.598, "args": { "External id": 17320,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040528.141, "dur": 1.109, "args": { "External id": 17321,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040528.673, "dur": 0.507, "args": { "External id": 17322,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040529.660, "dur": 3.113, "args": { "External id": 17323,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040532.145, "dur": 0.559, "args": { "External id": 17324,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040533.177, "dur": 1.509, "args": { "External id": 17325,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040534.093, "dur": 0.523, "args": { "External id": 17326,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040534.913, "dur": 1.074, "args": { "External id": 17327,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040535.451, "dur": 0.464, "args": { "External id": 17328,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040536.212, "dur": 3.465, "args": { "External id": 17329,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040539.039, "dur": 0.573, "args": { "External id": 17330,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040539.900, "dur": 1.364, "args": { "External id": 17331,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040540.599, "dur": 0.594, "args": { "External id": 17332,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040541.657, "dur": 2.594, "args": { "External id": 17333,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040542.003, "dur": 2.174, "args": { "External id": 17334,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040546.495, "dur": 1.581, "args": { "External id": 17335,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040547.492, "dur": 0.512, "args": { "External id": 17336,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040548.299, "dur": 0.920, "args": { "External id": 17337,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040548.648, "dur": 0.500, "args": { "External id": 17338,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040549.485, "dur": 3.051, "args": { "External id": 17339,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040552.065, "dur": 0.401, "args": { "External id": 17340,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040552.778, "dur": 1.644, "args": { "External id": 17341,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040553.755, "dur": 0.602, "args": { "External id": 17342,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040555.058, "dur": 1.287, "args": { "External id": 17343,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040555.547, "dur": 0.725, "args": { "External id": 17344,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040556.957, "dur": 3.441, "args": { "External id": 17345,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040559.610, "dur": 0.725, "args": { "External id": 17346,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040560.906, "dur": 1.293, "args": { "External id": 17347,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040561.732, "dur": 0.397, "args": { "External id": 17348,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040562.690, "dur": 2.715, "args": { "External id": 17349,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040563.253, "dur": 2.075, "args": { "External id": 17350,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040567.691, "dur": 1.585, "args": { "External id": 17351,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040568.575, "dur": 0.629, "args": { "External id": 17352,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040569.517, "dur": 1.247, "args": { "External id": 17353,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040569.871, "dur": 0.825, "args": { "External id": 17354,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040571.004, "dur": 2.709, "args": { "External id": 17355,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040573.226, "dur": 0.417, "args": { "External id": 17356,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040573.955, "dur": 1.389, "args": { "External id": 17357,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040574.945, "dur": 0.325, "args": { "External id": 17358,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040575.569, "dur": 1.054, "args": { "External id": 17359,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040576.076, "dur": 0.472, "args": { "External id": 17360,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040576.844, "dur": 3.195, "args": { "External id": 17361,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040579.608, "dur": 0.362, "args": { "External id": 17362,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040580.541, "dur": 1.399, "args": { "External id": 17363,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040581.378, "dur": 0.488, "args": { "External id": 17364,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040582.648, "dur": 2.760, "args": { "External id": 17365,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040583.013, "dur": 2.126, "args": { "External id": 17366,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040587.801, "dur": 1.091, "args": { "External id": 17367,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040588.567, "dur": 0.256, "args": { "External id": 17368,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040589.116, "dur": 1.063, "args": { "External id": 17369,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040589.465, "dur": 0.646, "args": { "External id": 17370,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040590.405, "dur": 2.910, "args": { "External id": 17371,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040592.930, "dur": 0.311, "args": { "External id": 17372,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040593.556, "dur": 1.456, "args": { "External id": 17373,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040594.311, "dur": 0.639, "args": { "External id": 17374,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040595.238, "dur": 1.230, "args": { "External id": 17375,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040595.740, "dur": 0.655, "args": { "External id": 17376,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040596.865, "dur": 3.345, "args": { "External id": 17377,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040599.709, "dur": 0.427, "args": { "External id": 17378,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040600.641, "dur": 1.211, "args": { "External id": 17379,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040601.399, "dur": 0.384, "args": { "External id": 17380,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040602.242, "dur": 3.249, "args": { "External id": 17381,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040602.610, "dur": 2.634, "args": { "External id": 17382,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040607.665, "dur": 1.248, "args": { "External id": 17383,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040608.552, "dur": 0.289, "args": { "External id": 17384,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040609.140, "dur": 1.135, "args": { "External id": 17385,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040609.493, "dur": 0.711, "args": { "External id": 17386,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040610.504, "dur": 3.138, "args": { "External id": 17387,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040613.133, "dur": 0.435, "args": { "External id": 17388,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040613.915, "dur": 1.273, "args": { "External id": 17389,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040614.837, "dur": 0.277, "args": { "External id": 17390,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040615.586, "dur": 1.419, "args": { "External id": 17391,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040616.135, "dur": 0.797, "args": { "External id": 17392,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040617.625, "dur": 3.326, "args": { "External id": 17393,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040620.177, "dur": 0.704, "args": { "External id": 17394,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040621.394, "dur": 1.046, "args": { "External id": 17395,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040622.048, "dur": 0.324, "args": { "External id": 17396,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040622.665, "dur": 3.268, "args": { "External id": 17397,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040623.042, "dur": 2.618, "args": { "External id": 17398,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040628.147, "dur": 1.125, "args": { "External id": 17399,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040628.883, "dur": 0.318, "args": { "External id": 17400,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040629.496, "dur": 0.950, "args": { "External id": 17401,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040629.838, "dur": 0.537, "args": { "External id": 17402,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040630.682, "dur": 2.764, "args": { "External id": 17403,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040633.040, "dur": 0.336, "args": { "External id": 17404,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040633.685, "dur": 1.109, "args": { "External id": 17405,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040634.403, "dur": 0.320, "args": { "External id": 17406,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040635.190, "dur": 1.073, "args": { "External id": 17407,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040635.623, "dur": 0.568, "args": { "External id": 17408,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040663.980, "dur": 3.278, "args": { "External id": 23553,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040666.613, "dur": 0.572, "args": { "External id": 23554,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040667.736, "dur": 1.154, "args": { "External id": 23555,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040668.481, "dur": 0.335, "args": { "External id": 23556,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040669.114, "dur": 2.931, "args": { "External id": 23557,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040669.462, "dur": 2.508, "args": { "External id": 23558,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040674.217, "dur": 0.881, "args": { "External id": 23559,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040674.791, "dur": 0.238, "args": { "External id": 23560,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040675.605, "dur": 1.291, "args": { "External id": 23561,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040676.375, "dur": 0.447, "args": { "External id": 23562,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040677.158, "dur": 3.892, "args": { "External id": 23563,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040680.636, "dur": 0.285, "args": { "External id": 23564,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040681.324, "dur": 1.423, "args": { "External id": 23565,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040682.298, "dur": 0.378, "args": { "External id": 23566,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040683.032, "dur": 1.398, "args": { "External id": 23567,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040684.097, "dur": 0.259, "args": { "External id": 23568,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040684.680, "dur": 3.411, "args": { "External id": 23569,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040687.625, "dur": 0.392, "args": { "External id": 23570,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040688.509, "dur": 1.328, "args": { "External id": 23571,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040689.465, "dur": 0.300, "args": { "External id": 23572,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040690.111, "dur": 3.438, "args": { "External id": 23573,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040691.017, "dur": 2.457, "args": { "External id": 23574,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040695.923, "dur": 1.066, "args": { "External id": 23575,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040696.522, "dur": 0.401, "args": { "External id": 23576,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040697.236, "dur": 0.927, "args": { "External id": 23577,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040697.759, "dur": 0.332, "args": { "External id": 23578,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040698.416, "dur": 3.285, "args": { "External id": 23579,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040701.215, "dur": 0.415, "args": { "External id": 23580,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040701.977, "dur": 1.436, "args": { "External id": 23581,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040702.918, "dur": 0.423, "args": { "External id": 23582,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040703.921, "dur": 1.079, "args": { "External id": 23583,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040704.487, "dur": 0.444, "args": { "External id": 23584,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040705.550, "dur": 2.717, "args": { "External id": 23585,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040707.956, "dur": 0.236, "args": { "External id": 23586,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040708.517, "dur": 0.816, "args": { "External id": 23587,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040708.982, "dur": 0.241, "args": { "External id": 23588,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040709.583, "dur": 3.293, "args": { "External id": 23589,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040710.031, "dur": 2.545, "args": { "External id": 23590,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040715.084, "dur": 0.765, "args": { "External id": 23591,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040715.511, "dur": 0.265, "args": { "External id": 23592,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040716.101, "dur": 0.855, "args": { "External id": 23593,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040716.636, "dur": 0.248, "args": { "External id": 23594,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040717.402, "dur": 2.890, "args": { "External id": 23595,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040719.971, "dur": 0.250, "args": { "External id": 23596,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040720.567, "dur": 0.747, "args": { "External id": 23597,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040720.996, "dur": 0.246, "args": { "External id": 23598,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040721.565, "dur": 0.950, "args": { "External id": 23599,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040722.035, "dur": 0.408, "args": { "External id": 23600,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040722.765, "dur": 3.052, "args": { "External id": 23601,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040725.369, "dur": 0.378, "args": { "External id": 23602,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040726.069, "dur": 0.774, "args": { "External id": 23603,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040726.511, "dur": 0.264, "args": { "External id": 23604,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040727.095, "dur": 3.127, "args": { "External id": 23605,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040727.718, "dur": 2.243, "args": { "External id": 23606,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040732.674, "dur": 1.092, "args": { "External id": 23607,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040733.155, "dur": 0.537, "args": { "External id": 23608,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040734.194, "dur": 1.014, "args": { "External id": 23609,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040734.661, "dur": 0.473, "args": { "External id": 23610,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040735.461, "dur": 2.915, "args": { "External id": 23611,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040738.096, "dur": 0.206, "args": { "External id": 23612,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040738.647, "dur": 0.873, "args": { "External id": 23613,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040739.067, "dur": 0.382, "args": { "External id": 23614,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040739.771, "dur": 0.920, "args": { "External id": 23615,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040740.365, "dur": 0.255, "args": { "External id": 23616,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040740.943, "dur": 3.216, "args": { "External id": 23617,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040743.830, "dur": 0.257, "args": { "External id": 23618,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040744.601, "dur": 0.759, "args": { "External id": 23619,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040745.088, "dur": 0.204, "args": { "External id": 23620,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040745.614, "dur": 3.015, "args": { "External id": 23621,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040746.159, "dur": 2.210, "args": { "External id": 23622,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040750.920, "dur": 0.888, "args": { "External id": 23623,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040751.480, "dur": 0.260, "args": { "External id": 23624,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040752.063, "dur": 0.966, "args": { "External id": 23625,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040752.651, "dur": 0.307, "args": { "External id": 23626,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040753.490, "dur": 2.997, "args": { "External id": 23627,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040756.198, "dur": 0.220, "args": { "External id": 23628,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040756.807, "dur": 0.982, "args": { "External id": 23629,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040757.236, "dur": 0.479, "args": { "External id": 23630,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040758.047, "dur": 0.828, "args": { "External id": 23631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040758.472, "dur": 0.330, "args": { "External id": 23632,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040759.320, "dur": 2.700, "args": { "External id": 23633,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040761.715, "dur": 0.236, "args": { "External id": 23634,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040762.646, "dur": 0.897, "args": { "External id": 23635,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040763.199, "dur": 0.274, "args": { "External id": 23636,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040763.793, "dur": 2.993, "args": { "External id": 23637,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040764.218, "dur": 2.491, "args": { "External id": 23638,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040769.051, "dur": 0.751, "args": { "External id": 23639,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040769.526, "dur": 0.207, "args": { "External id": 23640,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040770.053, "dur": 0.917, "args": { "External id": 23641,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040770.466, "dur": 0.429, "args": { "External id": 23642,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040771.391, "dur": 2.980, "args": { "External id": 23643,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040773.998, "dur": 0.301, "args": { "External id": 23644,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040774.663, "dur": 0.904, "args": { "External id": 23645,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040775.159, "dur": 0.333, "args": { "External id": 23646,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040775.818, "dur": 0.867, "args": { "External id": 23647,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040776.297, "dur": 0.314, "args": { "External id": 23648,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040777.136, "dur": 3.135, "args": { "External id": 23649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040779.787, "dur": 0.411, "args": { "External id": 23650,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040780.547, "dur": 0.731, "args": { "External id": 23651,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040780.991, "dur": 0.215, "args": { "External id": 23652,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040781.839, "dur": 2.905, "args": { "External id": 23653,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040782.292, "dur": 2.380, "args": { "External id": 23654,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040787.030, "dur": 0.803, "args": { "External id": 23655,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040787.547, "dur": 0.210, "args": { "External id": 23656,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040788.112, "dur": 0.899, "args": { "External id": 23657,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040788.557, "dur": 0.382, "args": { "External id": 23658,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040789.268, "dur": 3.228, "args": { "External id": 23659,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040792.165, "dur": 0.258, "args": { "External id": 23660,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040792.771, "dur": 0.833, "args": { "External id": 23661,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040793.260, "dur": 0.273, "args": { "External id": 23662,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040794.049, "dur": 0.858, "args": { "External id": 23663,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040794.555, "dur": 0.278, "args": { "External id": 23664,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040795.365, "dur": 3.186, "args": { "External id": 23665,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040798.149, "dur": 0.325, "args": { "External id": 23666,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040799.013, "dur": 0.978, "args": { "External id": 23667,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040799.493, "dur": 0.423, "args": { "External id": 23668,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040800.244, "dur": 2.717, "args": { "External id": 23669,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040800.763, "dur": 2.123, "args": { "External id": 23670,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040804.991, "dur": 0.989, "args": { "External id": 23671,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040805.698, "dur": 0.214, "args": { "External id": 23672,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040806.433, "dur": 0.962, "args": { "External id": 23673,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040806.993, "dur": 0.331, "args": { "External id": 23674,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040807.826, "dur": 2.803, "args": { "External id": 23675,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040810.250, "dur": 0.308, "args": { "External id": 23676,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040810.904, "dur": 0.733, "args": { "External id": 23677,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040811.350, "dur": 0.219, "args": { "External id": 23678,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040811.887, "dur": 0.732, "args": { "External id": 23679,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040812.293, "dur": 0.256, "args": { "External id": 23680,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040812.870, "dur": 2.759, "args": { "External id": 23681,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040815.323, "dur": 0.235, "args": { "External id": 23682,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040815.890, "dur": 2.287, "args": { "External id": 23683,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040817.849, "dur": 0.255, "args": { "External id": 23684,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040818.680, "dur": 2.651, "args": { "External id": 23685,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040819.136, "dur": 2.117, "args": { "External id": 23686,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040823.587, "dur": 0.863, "args": { "External id": 23687,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040824.006, "dur": 0.376, "args": { "External id": 23688,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040824.699, "dur": 0.805, "args": { "External id": 23689,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040825.130, "dur": 0.301, "args": { "External id": 23690,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040825.770, "dur": 2.651, "args": { "External id": 23691,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040828.069, "dur": 0.277, "args": { "External id": 23692,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040828.696, "dur": 0.865, "args": { "External id": 23693,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040829.119, "dur": 0.368, "args": { "External id": 23694,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040829.811, "dur": 1.208, "args": { "External id": 23695,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040830.477, "dur": 0.472, "args": { "External id": 23696,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040831.275, "dur": 2.812, "args": { "External id": 23697,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040833.755, "dur": 0.262, "args": { "External id": 23698,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040834.545, "dur": 0.785, "args": { "External id": 23699,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040834.997, "dur": 0.263, "args": { "External id": 23700,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040835.777, "dur": 2.954, "args": { "External id": 23701,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040836.220, "dur": 2.433, "args": { "External id": 23702,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040840.832, "dur": 0.736, "args": { "External id": 23703,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040841.278, "dur": 0.219, "args": { "External id": 23704,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040841.818, "dur": 0.938, "args": { "External id": 23705,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040842.235, "dur": 0.448, "args": { "External id": 23706,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040843.007, "dur": 2.675, "args": { "External id": 23707,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040845.374, "dur": 0.243, "args": { "External id": 23708,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040845.955, "dur": 0.984, "args": { "External id": 23709,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040846.392, "dur": 0.476, "args": { "External id": 23710,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040847.375, "dur": 0.761, "args": { "External id": 23711,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040847.799, "dur": 0.268, "args": { "External id": 23712,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040848.397, "dur": 2.998, "args": { "External id": 23713,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040851.087, "dur": 0.237, "args": { "External id": 23714,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040851.828, "dur": 0.776, "args": { "External id": 23715,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040852.304, "dur": 0.229, "args": { "External id": 23716,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040852.854, "dur": 2.747, "args": { "External id": 23717,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040853.285, "dur": 2.243, "args": { "External id": 23718,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040857.729, "dur": 0.872, "args": { "External id": 23719,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040858.171, "dur": 0.357, "args": { "External id": 23720,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040858.851, "dur": 1.075, "args": { "External id": 23721,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040859.509, "dur": 0.344, "args": { "External id": 23722,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040860.194, "dur": 3.377, "args": { "External id": 23723,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040863.114, "dur": 0.386, "args": { "External id": 23724,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040863.854, "dur": 1.103, "args": { "External id": 23725,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040864.287, "dur": 0.601, "args": { "External id": 23726,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040865.214, "dur": 1.542, "args": { "External id": 23727,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040866.285, "dur": 0.356, "args": { "External id": 23728,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040867.173, "dur": 2.847, "args": { "External id": 23729,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040869.686, "dur": 0.222, "args": { "External id": 23730,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040870.494, "dur": 0.961, "args": { "External id": 23731,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040871.142, "dur": 0.209, "args": { "External id": 23732,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040871.979, "dur": 2.791, "args": { "External id": 23733,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040872.453, "dur": 2.208, "args": { "External id": 23734,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040877.040, "dur": 1.054, "args": { "External id": 23735,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040877.599, "dur": 0.380, "args": { "External id": 23736,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040878.344, "dur": 0.899, "args": { "External id": 23737,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040878.783, "dur": 0.341, "args": { "External id": 23738,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040879.700, "dur": 2.720, "args": { "External id": 23739,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040882.042, "dur": 0.269, "args": { "External id": 23740,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040882.705, "dur": 0.819, "args": { "External id": 23741,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040883.198, "dur": 0.234, "args": { "External id": 23742,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040883.802, "dur": 0.789, "args": { "External id": 23743,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040884.214, "dur": 0.268, "args": { "External id": 23744,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040884.850, "dur": 2.383, "args": { "External id": 23745,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040886.886, "dur": 0.244, "args": { "External id": 23746,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040887.482, "dur": 0.879, "args": { "External id": 23747,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040888.104, "dur": 0.193, "args": { "External id": 23748,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040888.614, "dur": 3.033, "args": { "External id": 23749,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040889.041, "dur": 2.495, "args": { "External id": 23750,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040894.144, "dur": 1.535, "args": { "External id": 23751,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040894.587, "dur": 0.989, "args": { "External id": 23752,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040896.119, "dur": 2.020, "args": { "External id": 23753,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040896.944, "dur": 1.083, "args": { "External id": 23754,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040898.405, "dur": 3.139, "args": { "External id": 23755,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040900.863, "dur": 0.573, "args": { "External id": 23756,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040901.822, "dur": 1.089, "args": { "External id": 23757,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040902.230, "dur": 0.587, "args": { "External id": 23758,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040903.349, "dur": 1.204, "args": { "External id": 23759,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040903.756, "dur": 0.702, "args": { "External id": 23760,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040904.814, "dur": 3.024, "args": { "External id": 23761,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040906.938, "dur": 0.797, "args": { "External id": 23762,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040908.108, "dur": 1.346, "args": { "External id": 23763,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040908.742, "dur": 0.604, "args": { "External id": 23764,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040909.707, "dur": 3.014, "args": { "External id": 23765,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040910.346, "dur": 2.279, "args": { "External id": 23766,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040915.339, "dur": 1.485, "args": { "External id": 23767,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040915.929, "dur": 0.789, "args": { "External id": 23768,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040917.074, "dur": 1.564, "args": { "External id": 23769,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040917.479, "dur": 1.050, "args": { "External id": 23770,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040918.896, "dur": 3.478, "args": { "External id": 23771,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040921.382, "dur": 0.879, "args": { "External id": 23772,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040922.649, "dur": 1.325, "args": { "External id": 23773,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040923.256, "dur": 0.617, "args": { "External id": 23774,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040924.224, "dur": 1.461, "args": { "External id": 23775,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040924.797, "dur": 0.819, "args": { "External id": 23776,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040926.131, "dur": 3.342, "args": { "External id": 23777,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040928.404, "dur": 0.959, "args": { "External id": 23778,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040929.905, "dur": 1.148, "args": { "External id": 23779,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040930.317, "dur": 0.630, "args": { "External id": 23780,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040931.310, "dur": 3.324, "args": { "External id": 23781,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040931.890, "dur": 2.667, "args": { "External id": 23782,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040936.903, "dur": 1.077, "args": { "External id": 23783,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040937.312, "dur": 0.564, "args": { "External id": 23784,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040938.230, "dur": 1.253, "args": { "External id": 23785,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040938.674, "dur": 0.697, "args": { "External id": 23786,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040939.736, "dur": 3.467, "args": { "External id": 23787,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040942.311, "dur": 0.784, "args": { "External id": 23788,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040943.511, "dur": 1.366, "args": { "External id": 23789,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040943.922, "dur": 0.861, "args": { "External id": 23790,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040945.128, "dur": 1.115, "args": { "External id": 23791,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040945.529, "dur": 0.643, "args": { "External id": 23792,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040946.494, "dur": 3.296, "args": { "External id": 23793,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040948.909, "dur": 0.776, "args": { "External id": 23794,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040950.085, "dur": 0.910, "args": { "External id": 23795,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040950.495, "dur": 0.396, "args": { "External id": 23796,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040951.440, "dur": 2.808, "args": { "External id": 23797,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040951.834, "dur": 2.315, "args": { "External id": 23798,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040956.165, "dur": 1.508, "args": { "External id": 23799,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040956.952, "dur": 0.620, "args": { "External id": 23800,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040958.102, "dur": 1.780, "args": { "External id": 23801,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040958.709, "dur": 1.065, "args": { "External id": 23802,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040960.148, "dur": 3.807, "args": { "External id": 23803,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040963.133, "dur": 0.717, "args": { "External id": 23804,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040964.228, "dur": 1.627, "args": { "External id": 23805,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040964.903, "dur": 0.858, "args": { "External id": 23806,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040966.114, "dur": 1.422, "args": { "External id": 23807,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040966.735, "dur": 0.733, "args": { "External id": 23808,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040967.788, "dur": 3.180, "args": { "External id": 23809,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040970.051, "dur": 0.810, "args": { "External id": 23810,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040971.219, "dur": 1.002, "args": { "External id": 23811,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040971.712, "dur": 0.443, "args": { "External id": 23812,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040972.505, "dur": 2.633, "args": { "External id": 23813,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040972.949, "dur": 2.074, "args": { "External id": 23814,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040977.239, "dur": 1.584, "args": { "External id": 23815,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040977.956, "dur": 0.765, "args": { "External id": 23816,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040979.074, "dur": 1.289, "args": { "External id": 23817,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652040979.658, "dur": 0.635, "args": { "External id": 23818,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652040980.614, "dur": 29.562, "args": { "External id": 23819,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041008.176, "dur": 1.153, "args": { "External id": 23820,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041011.277, "dur": 1.644, "args": { "External id": 23821,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041012.426, "dur": 0.432, "args": { "External id": 23822,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041013.238, "dur": 1.390, "args": { "External id": 23823,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041013.687, "dur": 0.839, "args": { "External id": 23824,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041014.900, "dur": 3.285, "args": { "External id": 23825,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041017.199, "dur": 0.923, "args": { "External id": 23826,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041018.453, "dur": 1.578, "args": { "External id": 23827,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041019.072, "dur": 0.869, "args": { "External id": 23828,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041020.469, "dur": 2.760, "args": { "External id": 23829,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041021.156, "dur": 1.997, "args": { "External id": 23830,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041025.335, "dur": 1.420, "args": { "External id": 23831,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041025.973, "dur": 0.692, "args": { "External id": 23832,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041027.041, "dur": 2.010, "args": { "External id": 23833,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041028.218, "dur": 0.739, "args": { "External id": 23834,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041029.399, "dur": 2.992, "args": { "External id": 23835,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041031.740, "dur": 0.587, "args": { "External id": 23836,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041032.692, "dur": 1.542, "args": { "External id": 23837,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041033.573, "dur": 0.574, "args": { "External id": 23838,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041034.512, "dur": 1.190, "args": { "External id": 23839,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041034.927, "dur": 0.680, "args": { "External id": 23840,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041035.936, "dur": 2.858, "args": { "External id": 23841,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041038.111, "dur": 0.598, "args": { "External id": 23842,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041039.107, "dur": 1.122, "args": { "External id": 23843,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041039.531, "dur": 0.613, "args": { "External id": 23844,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041040.463, "dur": 2.968, "args": { "External id": 23845,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041041.113, "dur": 2.220, "args": { "External id": 23846,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041045.574, "dur": 1.341, "args": { "External id": 23847,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041046.129, "dur": 0.698, "args": { "External id": 23848,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041047.451, "dur": 1.833, "args": { "External id": 23849,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041048.346, "dur": 0.845, "args": { "External id": 23850,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041049.589, "dur": 2.871, "args": { "External id": 23851,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041051.781, "dur": 0.592, "args": { "External id": 23852,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041052.706, "dur": 1.625, "args": { "External id": 23853,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041053.536, "dur": 0.707, "args": { "External id": 23854,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041054.663, "dur": 1.257, "args": { "External id": 23855,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041055.091, "dur": 0.740, "args": { "External id": 23856,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041056.181, "dur": 3.552, "args": { "External id": 23857,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041059.025, "dur": 0.616, "args": { "External id": 23858,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041060.190, "dur": 1.336, "args": { "External id": 23859,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041060.835, "dur": 0.604, "args": { "External id": 23860,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041061.760, "dur": 3.877, "args": { "External id": 23861,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041062.940, "dur": 2.408, "args": { "External id": 23862,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041068.184, "dur": 1.182, "args": { "External id": 23863,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041068.704, "dur": 0.572, "args": { "External id": 23864,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041069.836, "dur": 1.851, "args": { "External id": 23865,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041070.747, "dur": 0.869, "args": { "External id": 23866,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041072.136, "dur": 2.924, "args": { "External id": 23867,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041074.256, "dur": 0.717, "args": { "External id": 23868,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041075.308, "dur": 1.292, "args": { "External id": 23869,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041075.944, "dur": 0.591, "args": { "External id": 23870,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041076.859, "dur": 1.534, "args": { "External id": 23871,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041077.440, "dur": 0.884, "args": { "External id": 23872,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041078.800, "dur": 3.522, "args": { "External id": 23873,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041081.478, "dur": 0.779, "args": { "External id": 23874,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041082.637, "dur": 1.136, "args": { "External id": 23875,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041083.062, "dur": 0.624, "args": { "External id": 23876,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041084.200, "dur": 3.101, "args": { "External id": 23877,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041085.070, "dur": 2.150, "args": { "External id": 23878,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041089.628, "dur": 1.337, "args": { "External id": 23879,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041090.267, "dur": 0.625, "args": { "External id": 23880,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041091.199, "dur": 1.395, "args": { "External id": 23881,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041091.878, "dur": 0.648, "args": { "External id": 23882,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041092.864, "dur": 2.789, "args": { "External id": 23883,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041095.157, "dur": 0.400, "args": { "External id": 23884,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041095.906, "dur": 1.749, "args": { "External id": 23885,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041097.021, "dur": 0.565, "args": { "External id": 23886,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041098.115, "dur": 1.325, "args": { "External id": 23887,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041098.716, "dur": 0.652, "args": { "External id": 23888,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041099.874, "dur": 3.693, "args": { "External id": 23889,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041102.675, "dur": 0.825, "args": { "External id": 23890,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041103.838, "dur": 0.906, "args": { "External id": 23891,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041104.269, "dur": 0.386, "args": { "External id": 23892,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041105.060, "dur": 2.737, "args": { "External id": 23893,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041105.746, "dur": 1.978, "args": { "External id": 23894,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041110.087, "dur": 1.250, "args": { "External id": 23895,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041110.742, "dur": 0.521, "args": { "External id": 23896,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041111.587, "dur": 1.600, "args": { "External id": 23897,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041112.653, "dur": 0.461, "args": { "External id": 23898,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041113.637, "dur": 3.144, "args": { "External id": 23899,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041116.309, "dur": 0.408, "args": { "External id": 23900,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041117.029, "dur": 1.453, "args": { "External id": 23901,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041117.904, "dur": 0.493, "args": { "External id": 23902,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041118.937, "dur": 1.049, "args": { "External id": 23903,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041119.351, "dur": 0.542, "args": { "External id": 23904,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041120.239, "dur": 3.753, "args": { "External id": 23905,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041123.339, "dur": 0.584, "args": { "External id": 23906,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041124.272, "dur": 1.350, "args": { "External id": 23907,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041124.679, "dur": 0.880, "args": { "External id": 23908,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041125.859, "dur": 3.440, "args": { "External id": 23909,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041127.028, "dur": 2.176, "args": { "External id": 23910,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041131.417, "dur": 1.341, "args": { "External id": 23911,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041132.071, "dur": 0.626, "args": { "External id": 23912,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041133.339, "dur": 1.585, "args": { "External id": 23913,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041134.132, "dur": 0.721, "args": { "External id": 23914,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041135.179, "dur": 3.414, "args": { "External id": 23915,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041137.806, "dur": 0.698, "args": { "External id": 23916,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041138.908, "dur": 1.936, "args": { "External id": 23917,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041139.855, "dur": 0.920, "args": { "External id": 23918,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041141.135, "dur": 1.903, "args": { "External id": 23919,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041141.797, "dur": 1.148, "args": { "External id": 23920,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041143.489, "dur": 3.644, "args": { "External id": 23921,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041146.467, "dur": 0.593, "args": { "External id": 23922,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041147.564, "dur": 1.440, "args": { "External id": 23923,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041148.202, "dur": 0.714, "args": { "External id": 23924,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041149.444, "dur": 3.360, "args": { "External id": 23925,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041150.625, "dur": 2.082, "args": { "External id": 23926,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041154.965, "dur": 1.441, "args": { "External id": 23927,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041155.598, "dur": 0.721, "args": { "External id": 23928,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041156.886, "dur": 1.713, "args": { "External id": 23929,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041157.882, "dur": 0.649, "args": { "External id": 23930,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041159.037, "dur": 2.986, "args": { "External id": 23931,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041161.177, "dur": 0.750, "args": { "External id": 23932,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041162.297, "dur": 1.747, "args": { "External id": 23933,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041163.144, "dur": 0.840, "args": { "External id": 23934,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041164.299, "dur": 1.238, "args": { "External id": 23935,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041164.757, "dur": 0.687, "args": { "External id": 23936,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041165.793, "dur": 3.729, "args": { "External id": 23937,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041168.797, "dur": 0.636, "args": { "External id": 23938,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336757, "tid": 1336757, "ts": 1295652041169.791, "dur": 2.832, "args": { "External id": 23939,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041171.879, "dur": 0.657, "args": { "External id": 23940,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 1336757, "tid": 1336757, "ts": 1295652041191.738, "dur": 175.307, "args": { "External id": 23941,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 1336757, "tid": 1336757, "ts": 1295652041483.777, "dur": 140.123, "args": { "External id": 23942,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[291], [], [], [], []], "Ev Idx": 11293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 1336757, "tid": 1336757, "ts": 1295652041550.241, "dur": 52.846, "args": { "External id": 23943,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[291], [], [], [], []], "Ev Idx": 11294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336757, "tid": 1336757, "ts": 1295652041567.456, "dur": 1.527, "args": { "External id": 23944,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11295 } }, { "ph": "X", "cat": "cpu_op", "name": "Redistribute", "pid": 1336757, "tid": 1336757, "ts": 1295652042055.776, "dur": 1033.545, "args": { "External id": 23945,"Sequence number": 246776, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "False"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336757, "tid": 1336757, "ts": 1295652042114.075, "dur": 111.819, "args": { "External id": 23946,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652042118.286, "dur": 1.699, "args": { "External id": 23947,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652042174.655, "dur": 0.724, "args": { "External id": 23948,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11299 } }, { "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::all_reduce", "pid": 1336757, "tid": 1336757, "ts": 1295652042272.198, "dur": 458.851, "args": { "External id": 23949,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["float", "", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336757, "tid": 1336757, "ts": 1295652042276.291, "dur": 64.843, "args": { "External id": 23950,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336757, "tid": 1336757, "ts": 1295652042280.661, "dur": 16.210, "args": { "External id": 23951,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "0"], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295652042288.079, "dur": 7.646, "args": { "External id": 23952,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336757, "tid": 1336757, "ts": 1295652042298.820, "dur": 41.404, "args": { "External id": 23953,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11304 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::allreduce_", "pid": 1336757, "tid": 1336757, "ts": 1295652042352.875, "dur": 374.782, "args": { "External id": 23954,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "-1"], "Input type": ["TensorList", "", "", "", "Scalar"], "Input Strides": [[[]], [], [], [], []], "Input Dims": [[[]], [], [], [], []], "Ev Idx": 11305 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295652042386.687, "dur": 334.492, "args": { "External id": 23955,"Record function id": 0, "Collective name": "allreduce", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 4, "Input Strides": [[[]], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "4", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1, "Process Group Name": "0", "Input type": ["TensorList", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[[]], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 11306, "In msg nelems": 1 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:all_reduce", "pid": 1336757, "tid": 1336757, "ts": 1295652042405.249, "dur": 310.803, "args": { "External id": 23956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336757, "tid": 1336757, "ts": 1295652042800.204, "dur": 248.783, "args": { "External id": 23957,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11308 } }, { "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::wait_tensor", "pid": 1336757, "tid": 1336757, "ts": 1295652042896.197, "dur": 32.858, "args": { "External id": 23958,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11309 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336757, "tid": 1336757, "ts": 1295652042915.818, "dur": 4.312, "args": { "External id": 23959,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "4", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 11310, "In msg nelems": 0, "Rank": 4, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336757, "tid": 1336757, "ts": 1295652042958.954, "dur": 82.203, "args": { "External id": 23960,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652042961.793, "dur": 1.376, "args": { "External id": 23961,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652042964.511, "dur": 0.685, "args": { "External id": 23962,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11313 } }, { "ph": "X", "cat": "cpu_op", "name": "_ToTorchTensor", "pid": 1336757, "tid": 1336757, "ts": 1295652043108.538, "dur": 23.720, "args": { "External id": 23963,"Sequence number": 246777, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336757, "tid": 1336757, "ts": 1295652043119.942, "dur": 8.780, "args": { "External id": 23964,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336757, "tid": 1336757, "ts": 1295652043122.928, "dur": 5.550, "args": { "External id": 23965,"Record function id": 0, "Concrete Inputs": ["", "[]"], "Input type": ["float", "ScalarList"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336757, "tid": 1336757, "ts": 1295652043528.535, "dur": 46.222, "args": { "External id": 23966,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "double", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reciprocal", "pid": 1336757, "tid": 1336757, "ts": 1295652043585.394, "dur": 23.967, "args": { "External id": 23967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mul", "pid": 1336757, "tid": 1336757, "ts": 1295652043616.701, "dur": 23.853, "args": { "External id": 23968,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "double"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clamp", "pid": 1336757, "tid": 1336757, "ts": 1295652043653.583, "dur": 34.717, "args": { "External id": 23969,"Record function id": 0, "Concrete Inputs": ["", "", "1."], "Input type": ["float", "", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652043656.944, "dur": 0.866, "args": { "External id": 23970,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336757, "tid": 1336757, "ts": 1295652043711.095, "dur": 0.502, "args": { "External id": 23971,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 11322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 1336757, "tid": 1336757, "ts": 1295652043825.087, "dur": 894.356, "args": { "External id": 23972,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 1336757, "tid": 1336757, "ts": 1295652044401.224, "dur": 284.369, "args": { "External id": 23973,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::isnan", "pid": 1336757, "tid": 1336757, "ts": 1295652044769.260, "dur": 31.395, "args": { "External id": 23974,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336757, "tid": 1336757, "ts": 1295652044772.819, "dur": 27.276, "args": { "External id": 23975,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336757, "tid": 1336757, "ts": 1295652044804.754, "dur": 222.179, "args": { "External id": 23976,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1336757, "ts": 1295652044806.437, "dur": 220.247, "args": { "External id": 23977,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1336757, "ts": 1295652044808.457, "dur": 217.410, "args": { "External id": 23978,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::isinf", "pid": 1336757, "tid": 1336757, "ts": 1295652045033.761, "dur": 66.665, "args": { "External id": 23979,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295652045036.687, "dur": 38.926, "args": { "External id": 23980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336757, "tid": 1336757, "ts": 1295652045045.172, "dur": 3.692, "args": { "External id": 23981,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336757, "tid": 1336757, "ts": 1295652045051.033, "dur": 24.237, "args": { "External id": 23982,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], [1]], "Input Dims": [[], [0]], "Ev Idx": 11333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336757, "tid": 1336757, "ts": 1295652045056.414, "dur": 3.330, "args": { "External id": 23983,"Record function id": 0, "Concrete Inputs": ["", "[]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 11334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336757, "tid": 1336757, "ts": 1295652045077.543, "dur": 22.135, "args": { "External id": 23984,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336757, "tid": 1336757, "ts": 1295652045103.274, "dur": 36.876, "args": { "External id": 23985,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336757, "tid": 1336757, "ts": 1295652045106.856, "dur": 33.030, "args": { "External id": 23986,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336757, "tid": 1336757, "ts": 1295652045107.907, "dur": 31.679, "args": { "External id": 23987,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11338 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#OptimizersContainer.step", "pid": 1336757, "tid": 1336757, "ts": 1295652045173.907, "dur": 6273.954, "args": { "External id": 23988,"Record function id": 0, "Ev Idx": 11339 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#AdamW.step", "pid": 1336757, "tid": 1336757, "ts": 1295652045207.327, "dur": 6217.452, "args": { "External id": 23989,"Record function id": 0, "Ev Idx": 11340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_add_", "pid": 1336757, "tid": 1336757, "ts": 1295652046618.276, "dur": 297.944, "args": { "External id": 23990,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046639.750, "dur": 1.491, "args": { "External id": 23991,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046642.702, "dur": 0.074, "args": { "External id": 23992,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046643.174, "dur": 0.294, "args": { "External id": 23993,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046644.006, "dur": 0.373, "args": { "External id": 23994,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046644.721, "dur": 0.200, "args": { "External id": 23995,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046645.301, "dur": 0.199, "args": { "External id": 23996,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046645.897, "dur": 0.291, "args": { "External id": 23997,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046646.554, "dur": 0.248, "args": { "External id": 23998,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046647.707, "dur": 0.280, "args": { "External id": 23999,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046648.362, "dur": 0.267, "args": { "External id": 24000,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046649.009, "dur": 0.272, "args": { "External id": 24001,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046649.626, "dur": 0.063, "args": { "External id": 24002,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046650.236, "dur": 0.067, "args": { "External id": 24003,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046650.706, "dur": 0.066, "args": { "External id": 24004,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046651.256, "dur": 0.247, "args": { "External id": 24005,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046651.859, "dur": 0.280, "args": { "External id": 24006,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046652.577, "dur": 0.075, "args": { "External id": 24007,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046653.015, "dur": 0.072, "args": { "External id": 24008,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046653.432, "dur": 0.105, "args": { "External id": 24009,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046653.955, "dur": 0.097, "args": { "External id": 24010,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046654.416, "dur": 0.058, "args": { "External id": 24011,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046654.819, "dur": 0.073, "args": { "External id": 24012,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046655.213, "dur": 0.066, "args": { "External id": 24013,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046655.538, "dur": 0.072, "args": { "External id": 24014,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046655.981, "dur": 0.080, "args": { "External id": 24015,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046656.450, "dur": 0.068, "args": { "External id": 24016,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046656.839, "dur": 0.054, "args": { "External id": 24017,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046657.214, "dur": 0.058, "args": { "External id": 24018,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046657.723, "dur": 0.064, "args": { "External id": 24019,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046658.186, "dur": 0.061, "args": { "External id": 24020,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046658.683, "dur": 0.062, "args": { "External id": 24021,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046659.087, "dur": 0.058, "args": { "External id": 24022,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046659.503, "dur": 0.081, "args": { "External id": 24023,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046659.933, "dur": 0.063, "args": { "External id": 24024,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046660.415, "dur": 0.063, "args": { "External id": 24025,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046660.956, "dur": 0.065, "args": { "External id": 24026,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046661.452, "dur": 0.068, "args": { "External id": 24027,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046661.865, "dur": 0.063, "args": { "External id": 24028,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046662.260, "dur": 0.063, "args": { "External id": 24029,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046662.678, "dur": 0.061, "args": { "External id": 24030,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046663.101, "dur": 0.068, "args": { "External id": 24031,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046663.573, "dur": 0.053, "args": { "External id": 24032,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046663.929, "dur": 0.063, "args": { "External id": 24033,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046664.308, "dur": 0.068, "args": { "External id": 24034,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046664.747, "dur": 0.064, "args": { "External id": 24035,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046665.204, "dur": 0.062, "args": { "External id": 24036,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046665.682, "dur": 0.064, "args": { "External id": 24037,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046666.097, "dur": 0.059, "args": { "External id": 24038,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046666.463, "dur": 0.293, "args": { "External id": 24039,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046667.066, "dur": 0.266, "args": { "External id": 24040,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046667.906, "dur": 0.087, "args": { "External id": 24041,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046668.466, "dur": 0.317, "args": { "External id": 24042,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046669.143, "dur": 0.063, "args": { "External id": 24043,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046669.816, "dur": 0.256, "args": { "External id": 24044,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046670.702, "dur": 0.050, "args": { "External id": 24045,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046671.040, "dur": 0.063, "args": { "External id": 24046,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046671.452, "dur": 0.057, "args": { "External id": 24047,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046671.890, "dur": 0.062, "args": { "External id": 24048,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046672.931, "dur": 0.052, "args": { "External id": 24049,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046673.466, "dur": 0.068, "args": { "External id": 24050,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046674.370, "dur": 0.069, "args": { "External id": 24051,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046674.825, "dur": 0.063, "args": { "External id": 24052,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046675.659, "dur": 0.062, "args": { "External id": 24053,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046675.972, "dur": 0.047, "args": { "External id": 24054,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046676.714, "dur": 0.053, "args": { "External id": 24055,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046677.019, "dur": 0.050, "args": { "External id": 24056,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046677.772, "dur": 0.064, "args": { "External id": 24057,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046678.092, "dur": 0.064, "args": { "External id": 24058,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046678.978, "dur": 0.052, "args": { "External id": 24059,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046679.274, "dur": 0.050, "args": { "External id": 24060,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046679.876, "dur": 0.063, "args": { "External id": 24061,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046680.189, "dur": 0.048, "args": { "External id": 24062,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046680.985, "dur": 0.062, "args": { "External id": 24063,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046681.298, "dur": 0.046, "args": { "External id": 24064,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046710.151, "dur": 0.090, "args": { "External id": 24065,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046710.576, "dur": 0.050, "args": { "External id": 24066,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046711.355, "dur": 0.054, "args": { "External id": 24067,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046711.672, "dur": 0.052, "args": { "External id": 24068,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046712.459, "dur": 0.066, "args": { "External id": 24069,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046712.767, "dur": 0.054, "args": { "External id": 24070,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046713.587, "dur": 0.063, "args": { "External id": 24071,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046713.898, "dur": 0.052, "args": { "External id": 24072,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046714.499, "dur": 0.065, "args": { "External id": 24073,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046714.961, "dur": 0.051, "args": { "External id": 24074,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046715.617, "dur": 0.064, "args": { "External id": 24075,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046716.225, "dur": 0.060, "args": { "External id": 24076,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046716.877, "dur": 0.059, "args": { "External id": 24077,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046717.187, "dur": 0.050, "args": { "External id": 24078,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046717.897, "dur": 0.066, "args": { "External id": 24079,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046718.370, "dur": 0.057, "args": { "External id": 24080,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046718.970, "dur": 0.066, "args": { "External id": 24081,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046719.283, "dur": 0.052, "args": { "External id": 24082,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046719.823, "dur": 0.064, "args": { "External id": 24083,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046720.142, "dur": 0.052, "args": { "External id": 24084,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046720.764, "dur": 0.065, "args": { "External id": 24085,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046721.076, "dur": 0.048, "args": { "External id": 24086,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046721.885, "dur": 0.065, "args": { "External id": 24087,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046722.196, "dur": 0.054, "args": { "External id": 24088,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046723.003, "dur": 0.065, "args": { "External id": 24089,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046723.314, "dur": 0.049, "args": { "External id": 24090,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046724.127, "dur": 0.066, "args": { "External id": 24091,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046724.436, "dur": 0.055, "args": { "External id": 24092,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046725.249, "dur": 0.069, "args": { "External id": 24093,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046725.591, "dur": 0.050, "args": { "External id": 24094,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046726.430, "dur": 0.066, "args": { "External id": 24095,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046726.746, "dur": 0.050, "args": { "External id": 24096,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046727.528, "dur": 0.064, "args": { "External id": 24097,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046727.847, "dur": 0.049, "args": { "External id": 24098,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046728.539, "dur": 0.066, "args": { "External id": 24099,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046728.889, "dur": 0.047, "args": { "External id": 24100,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046729.710, "dur": 0.060, "args": { "External id": 24101,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046730.026, "dur": 0.050, "args": { "External id": 24102,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046730.625, "dur": 0.056, "args": { "External id": 24103,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046730.928, "dur": 0.050, "args": { "External id": 24104,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046731.558, "dur": 0.063, "args": { "External id": 24105,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046731.862, "dur": 0.054, "args": { "External id": 24106,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046732.576, "dur": 0.055, "args": { "External id": 24107,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046732.872, "dur": 0.049, "args": { "External id": 24108,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046733.525, "dur": 0.062, "args": { "External id": 24109,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046733.854, "dur": 0.049, "args": { "External id": 24110,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046734.656, "dur": 0.066, "args": { "External id": 24111,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046734.965, "dur": 0.049, "args": { "External id": 24112,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046735.596, "dur": 0.057, "args": { "External id": 24113,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046735.896, "dur": 0.048, "args": { "External id": 24114,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046736.438, "dur": 0.053, "args": { "External id": 24115,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046736.738, "dur": 0.047, "args": { "External id": 24116,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046737.282, "dur": 0.064, "args": { "External id": 24117,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046743.951, "dur": 0.082, "args": { "External id": 24118,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046744.672, "dur": 0.063, "args": { "External id": 24119,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046744.976, "dur": 0.048, "args": { "External id": 24120,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046745.741, "dur": 0.054, "args": { "External id": 24121,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046746.041, "dur": 0.048, "args": { "External id": 24122,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046746.849, "dur": 0.062, "args": { "External id": 24123,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046747.158, "dur": 0.049, "args": { "External id": 24124,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046747.865, "dur": 0.068, "args": { "External id": 24125,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046748.214, "dur": 0.051, "args": { "External id": 24126,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046749.006, "dur": 0.057, "args": { "External id": 24127,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046749.309, "dur": 0.047, "args": { "External id": 24128,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046749.922, "dur": 0.060, "args": { "External id": 24129,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046750.222, "dur": 0.049, "args": { "External id": 24130,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046750.994, "dur": 0.067, "args": { "External id": 24131,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046751.305, "dur": 0.050, "args": { "External id": 24132,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046751.868, "dur": 0.052, "args": { "External id": 24133,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046752.168, "dur": 0.053, "args": { "External id": 24134,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046752.905, "dur": 0.063, "args": { "External id": 24135,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046753.211, "dur": 0.051, "args": { "External id": 24136,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046754.067, "dur": 0.055, "args": { "External id": 24137,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046754.374, "dur": 0.056, "args": { "External id": 24138,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046755.005, "dur": 0.064, "args": { "External id": 24139,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046755.306, "dur": 0.059, "args": { "External id": 24140,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046755.851, "dur": 0.066, "args": { "External id": 24141,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046756.163, "dur": 0.054, "args": { "External id": 24142,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046756.733, "dur": 0.068, "args": { "External id": 24143,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046757.042, "dur": 0.052, "args": { "External id": 24144,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046757.791, "dur": 0.062, "args": { "External id": 24145,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046758.113, "dur": 0.051, "args": { "External id": 24146,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046758.988, "dur": 0.053, "args": { "External id": 24147,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046759.285, "dur": 0.054, "args": { "External id": 24148,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046760.125, "dur": 0.056, "args": { "External id": 24149,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046760.422, "dur": 0.050, "args": { "External id": 24150,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046761.183, "dur": 0.064, "args": { "External id": 24151,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046761.493, "dur": 0.049, "args": { "External id": 24152,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046762.261, "dur": 0.056, "args": { "External id": 24153,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046762.562, "dur": 0.059, "args": { "External id": 24154,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046763.095, "dur": 0.055, "args": { "External id": 24155,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046763.394, "dur": 0.051, "args": { "External id": 24156,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046764.044, "dur": 0.054, "args": { "External id": 24157,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046764.343, "dur": 0.049, "args": { "External id": 24158,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046765.162, "dur": 0.056, "args": { "External id": 24159,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046765.461, "dur": 0.053, "args": { "External id": 24160,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046766.052, "dur": 0.056, "args": { "External id": 24161,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046766.353, "dur": 0.047, "args": { "External id": 24162,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046767.288, "dur": 0.055, "args": { "External id": 24163,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046767.590, "dur": 0.052, "args": { "External id": 24164,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046768.509, "dur": 0.063, "args": { "External id": 24165,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046768.841, "dur": 0.049, "args": { "External id": 24166,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046769.445, "dur": 0.062, "args": { "External id": 24167,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046769.758, "dur": 0.050, "args": { "External id": 24168,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046770.706, "dur": 0.048, "args": { "External id": 24169,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046770.997, "dur": 0.050, "args": { "External id": 24170,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046771.672, "dur": 0.053, "args": { "External id": 24171,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046771.977, "dur": 0.052, "args": { "External id": 24172,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046772.745, "dur": 0.067, "args": { "External id": 24173,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046773.060, "dur": 0.047, "args": { "External id": 24174,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046773.759, "dur": 0.066, "args": { "External id": 24175,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046774.071, "dur": 0.047, "args": { "External id": 24176,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046774.645, "dur": 0.062, "args": { "External id": 24177,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046774.976, "dur": 0.046, "args": { "External id": 24178,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046775.493, "dur": 0.064, "args": { "External id": 24179,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046775.799, "dur": 0.056, "args": { "External id": 24180,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046776.368, "dur": 0.064, "args": { "External id": 24181,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046776.680, "dur": 0.047, "args": { "External id": 24182,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046777.282, "dur": 0.069, "args": { "External id": 24183,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046777.590, "dur": 0.047, "args": { "External id": 24184,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046778.141, "dur": 0.063, "args": { "External id": 24185,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046778.448, "dur": 0.052, "args": { "External id": 24186,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046779.085, "dur": 0.066, "args": { "External id": 24187,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046779.555, "dur": 0.066, "args": { "External id": 24188,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046780.175, "dur": 0.057, "args": { "External id": 24189,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046780.741, "dur": 0.065, "args": { "External id": 24190,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046781.359, "dur": 0.063, "args": { "External id": 24191,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046781.673, "dur": 0.047, "args": { "External id": 24192,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046782.237, "dur": 0.063, "args": { "External id": 24193,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046782.539, "dur": 0.052, "args": { "External id": 24194,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046783.598, "dur": 0.061, "args": { "External id": 24195,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046783.901, "dur": 0.050, "args": { "External id": 24196,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046784.737, "dur": 0.066, "args": { "External id": 24197,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046785.082, "dur": 0.060, "args": { "External id": 24198,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046785.873, "dur": 0.064, "args": { "External id": 24199,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046786.179, "dur": 0.051, "args": { "External id": 24200,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046786.746, "dur": 0.055, "args": { "External id": 24201,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046787.044, "dur": 0.056, "args": { "External id": 24202,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046787.895, "dur": 0.054, "args": { "External id": 24203,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046788.189, "dur": 0.055, "args": { "External id": 24204,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046789.022, "dur": 0.066, "args": { "External id": 24205,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046789.333, "dur": 0.058, "args": { "External id": 24206,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046789.951, "dur": 0.061, "args": { "External id": 24207,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046790.262, "dur": 0.050, "args": { "External id": 24208,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046791.050, "dur": 0.067, "args": { "External id": 24209,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046791.360, "dur": 0.049, "args": { "External id": 24210,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046792.059, "dur": 0.054, "args": { "External id": 24211,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046792.354, "dur": 0.052, "args": { "External id": 24212,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046792.917, "dur": 0.054, "args": { "External id": 24213,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046793.212, "dur": 0.053, "args": { "External id": 24214,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046794.139, "dur": 0.064, "args": { "External id": 24215,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046794.460, "dur": 0.052, "args": { "External id": 24216,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046795.840, "dur": 0.065, "args": { "External id": 24217,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046796.172, "dur": 0.050, "args": { "External id": 24218,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046796.885, "dur": 0.067, "args": { "External id": 24219,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046797.231, "dur": 0.052, "args": { "External id": 24220,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046797.979, "dur": 0.070, "args": { "External id": 24221,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046798.305, "dur": 0.051, "args": { "External id": 24222,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046799.098, "dur": 0.053, "args": { "External id": 24223,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046799.412, "dur": 0.050, "args": { "External id": 24224,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046799.986, "dur": 0.065, "args": { "External id": 24225,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046800.307, "dur": 0.054, "args": { "External id": 24226,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046800.851, "dur": 0.068, "args": { "External id": 24227,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046801.174, "dur": 0.049, "args": { "External id": 24228,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046801.718, "dur": 0.060, "args": { "External id": 24229,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046802.034, "dur": 0.057, "args": { "External id": 24230,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046802.857, "dur": 0.062, "args": { "External id": 24231,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046803.175, "dur": 0.051, "args": { "External id": 24232,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046803.740, "dur": 0.067, "args": { "External id": 24233,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046804.065, "dur": 0.040, "args": { "External id": 24234,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046804.612, "dur": 0.061, "args": { "External id": 24235,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046804.928, "dur": 0.051, "args": { "External id": 24236,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046805.552, "dur": 0.061, "args": { "External id": 24237,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046805.872, "dur": 0.050, "args": { "External id": 24238,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046806.508, "dur": 0.060, "args": { "External id": 24239,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046806.832, "dur": 0.054, "args": { "External id": 24240,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046807.538, "dur": 0.062, "args": { "External id": 24241,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046807.870, "dur": 0.050, "args": { "External id": 24242,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046808.761, "dur": 0.046, "args": { "External id": 24243,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046809.063, "dur": 0.043, "args": { "External id": 24244,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046809.896, "dur": 0.060, "args": { "External id": 24245,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046810.211, "dur": 0.048, "args": { "External id": 24246,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046810.778, "dur": 0.052, "args": { "External id": 24247,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046811.080, "dur": 0.046, "args": { "External id": 24248,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046811.635, "dur": 0.068, "args": { "External id": 24249,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046811.962, "dur": 0.051, "args": { "External id": 24250,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046812.515, "dur": 0.065, "args": { "External id": 24251,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046812.837, "dur": 0.049, "args": { "External id": 24252,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046813.447, "dur": 0.059, "args": { "External id": 24253,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046813.763, "dur": 0.048, "args": { "External id": 24254,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046814.473, "dur": 0.067, "args": { "External id": 24255,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046814.798, "dur": 0.046, "args": { "External id": 24256,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046815.532, "dur": 0.066, "args": { "External id": 24257,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046815.850, "dur": 0.052, "args": { "External id": 24258,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046816.576, "dur": 0.063, "args": { "External id": 24259,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046816.894, "dur": 0.046, "args": { "External id": 24260,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046817.669, "dur": 0.062, "args": { "External id": 24261,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046817.986, "dur": 0.052, "args": { "External id": 24262,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046818.521, "dur": 0.065, "args": { "External id": 24263,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046818.845, "dur": 0.051, "args": { "External id": 24264,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046819.537, "dur": 0.065, "args": { "External id": 24265,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046819.881, "dur": 0.056, "args": { "External id": 24266,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046820.475, "dur": 0.066, "args": { "External id": 24267,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046820.792, "dur": 0.050, "args": { "External id": 24268,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046821.323, "dur": 0.059, "args": { "External id": 24269,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046821.633, "dur": 0.051, "args": { "External id": 24270,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046822.204, "dur": 0.054, "args": { "External id": 24271,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046822.520, "dur": 0.048, "args": { "External id": 24272,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046823.246, "dur": 0.071, "args": { "External id": 24273,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046823.571, "dur": 0.050, "args": { "External id": 24274,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046824.368, "dur": 0.046, "args": { "External id": 24275,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046824.671, "dur": 0.057, "args": { "External id": 24276,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046825.429, "dur": 0.065, "args": { "External id": 24277,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046825.744, "dur": 0.052, "args": { "External id": 24278,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046826.484, "dur": 0.057, "args": { "External id": 24279,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046826.824, "dur": 0.046, "args": { "External id": 24280,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336757, "tid": 1336757, "ts": 1295652046827.523, "dur": 0.067, "args": { "External id": 24281,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 1336757, "tid": 1336757, "ts": 1295652047480.306, "dur": 3847.463, "args": { "External id": 24282,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.0001023488255872064", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 11633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 1336757, "tid": 1336757, "ts": 1295652050744.331, "dur": 384.266, "args": { "External id": 24283,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.0001023488255872064", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 11634 } }, { "name": "process_name", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 0, "args": { "name": "python3.12" } }, { "name": "process_labels", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 0, "args": { "labels": "CPU" } }, { "name": "process_sort_index", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 0, "args": { "sort_index": 1336757 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 1381170, "args": { "name": "thread 1381170 (pt_autograd_4)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 1381170, "args": { "sort_index": 1381170 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 1336757, "args": { "name": "thread 1336757 (python3.12)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 1336757, "args": { "sort_index": 1336757 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 1381170, "args": { "name": "thread 1381170 (python3.12)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886893.277, "pid": 1336757, "tid": 1381170, "args": { "sort_index": 1381170 } }, { "ph": "X", "cat": "Trace", "ts": 1295649886827.411, "dur": 2166235.550, "pid": "Spans", "tid": "PyTorch Profiler", "name": "PyTorch Profiler (0)", "args": { "Op count": 0 } }, { "name": "process_sort_index", "ph": "M", "ts": 1295649886827.411, "pid": "Spans", "tid": 0, "args": { "sort_index": 536870912 } }, { "name": "Iteration Start: PyTorch Profiler", "ph": "i", "s": "g", "pid": "Traces", "tid": "Trace PyTorch Profiler", "ts": 1295649886827.411 }, { "name": "Record Window End", "ph": "i", "s": "g", "pid": "", "tid": "", "ts": 1295652116571.991 } ], "traceName": "exp/mtp.1B.batch16.seqlen4096.context4096.warmup2000.update1.steps200000.lr2e-4.cosine/profile_trace/iteration_1024/rank4_trace.json", "displayTimeUnit": "ms", "baseTimeNanoseconds": 1751410836000000000 }